1 /* Implementation of Fortran lexer
2 Copyright (C) 1995, 1996, 1997, 1998, 2001, 2002, 2003
3 Free Software Foundation, Inc.
4 Contributed by James Craig Burley.
6 This file is part of GNU Fortran.
8 GNU Fortran is free software; you can redistribute it and/or modify
9 it under the terms of the GNU General Public License as published by
10 the Free Software Foundation; either version 2, or (at your option)
13 GNU Fortran is distributed in the hope that it will be useful,
14 but WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 GNU General Public License for more details.
18 You should have received a copy of the GNU General Public License
19 along with GNU Fortran; see the file COPYING. If not, write to
20 the Free Software Foundation, 59 Temple Place - Suite 330, Boston, MA
37 static void ffelex_append_to_token_ (char c
);
38 static int ffelex_backslash_ (int c
, ffewhereColumnNumber col
);
39 static void ffelex_bad_1_ (ffebad errnum
, ffewhereLineNumber ln0
,
40 ffewhereColumnNumber cn0
);
41 static void ffelex_bad_2_ (ffebad errnum
, ffewhereLineNumber ln0
,
42 ffewhereColumnNumber cn0
, ffewhereLineNumber ln1
,
43 ffewhereColumnNumber cn1
);
44 static void ffelex_bad_here_ (int num
, ffewhereLineNumber ln0
,
45 ffewhereColumnNumber cn0
);
46 static void ffelex_finish_statement_ (void);
47 static int ffelex_get_directive_line_ (char **text
, FILE *finput
);
48 static int ffelex_hash_ (FILE *f
);
49 static ffewhereColumnNumber
ffelex_image_char_ (int c
,
50 ffewhereColumnNumber col
);
51 static void ffelex_include_ (void);
52 static bool ffelex_is_free_char_ctx_contin_ (ffewhereColumnNumber col
);
53 static bool ffelex_is_free_nonc_ctx_contin_ (ffewhereColumnNumber col
);
54 static void ffelex_next_line_ (void);
55 static void ffelex_prepare_eos_ (void);
56 static void ffelex_send_token_ (void);
57 static ffelexHandler
ffelex_swallow_tokens_ (ffelexToken t
);
58 static ffelexToken
ffelex_token_new_ (void);
60 /* Pertaining to the geometry of the input file. */
62 /* Initial size for card image to be allocated. */
63 #define FFELEX_columnINITIAL_SIZE_ 255
65 /* The card image itself, which grows as source lines get longer. It
66 has room for ffelex_card_size_ + 8 characters, and the length of the
67 current image is ffelex_card_length_. (The + 8 characters are made
68 available for easy handling of tabs and such.) */
69 static char *ffelex_card_image_
;
70 static ffewhereColumnNumber ffelex_card_size_
;
71 static ffewhereColumnNumber ffelex_card_length_
;
73 /* Max width for free-form lines (ISO F90). */
74 #define FFELEX_FREE_MAX_COLUMNS_ 132
76 /* True if we saw a tab on the current line, as this (currently) means
77 the line is therefore treated as though final_nontab_column_ were
79 static bool ffelex_saw_tab_
;
81 /* TRUE if current line is known to be erroneous, so don't bother
82 expanding room for it just to display it. */
83 static bool ffelex_bad_line_
= FALSE
;
85 /* Last column for vanilla, i.e. non-tabbed, line. Usually 72 or 132. */
86 static ffewhereColumnNumber ffelex_final_nontab_column_
;
88 /* Array for quickly deciding what kind of line the current card has,
89 based on its first character. */
90 static ffelexType ffelex_first_char_
[256];
92 /* Pertaining to file management. */
94 /* The wf argument of the most recent active ffelex_file_(fixed,free)
96 static GTY (()) ffewhereFile ffelex_current_wf_
;
98 /* TRUE if an INCLUDE statement can be processed (ffelex_set_include
100 static bool ffelex_permit_include_
;
102 /* TRUE if an INCLUDE statement is pending (ffelex_set_include has been
104 static bool ffelex_set_include_
;
106 /* Information on the pending INCLUDE file. */
107 static FILE *ffelex_include_file_
;
108 static bool ffelex_include_free_form_
;
109 static GTY(()) ffewhereFile ffelex_include_wherefile_
;
111 /* Current master line count. */
112 static ffewhereLineNumber ffelex_linecount_current_
;
113 /* Next master line count. */
114 static ffewhereLineNumber ffelex_linecount_next_
;
116 /* ffewhere info on the latest (currently active) line read from the
117 active source file. */
118 static ffewhereLine ffelex_current_wl_
;
119 static ffewhereColumn ffelex_current_wc_
;
121 /* Pertaining to tokens in general. */
123 /* Initial capacity for text in a CHARACTER/HOLLERITH/NAME/NAMES/NUMBER
125 #define FFELEX_columnTOKEN_SIZE_ 63
126 #if FFELEX_columnTOKEN_SIZE_ < FFEWHERE_indexMAX
127 #error "token size too small!"
130 /* Current token being lexed. */
131 static ffelexToken ffelex_token_
;
133 /* Handler for current token. */
134 static ffelexHandler ffelex_handler_
;
136 /* TRUE if fixed-form lexer is to generate NAMES instead of NAME tokens. */
137 static bool ffelex_names_
;
139 /* TRUE if both lexers are to generate NAMES instead of NAME tokens. */
140 static bool ffelex_names_pure_
;
142 /* TRUE if 0-9 starts a NAME token instead of NUMBER, for parsing hex
144 static bool ffelex_hexnum_
;
146 /* For ffelex_swallow_tokens(). */
147 static ffelexHandler ffelex_eos_handler_
;
149 /* Number of tokens sent since last EOS or beginning of input file
150 (include INCLUDEd files). */
151 static unsigned long int ffelex_number_of_tokens_
;
153 /* Number of labels sent (as NUMBER tokens) since last reset of
154 ffelex_number_of_tokens_ to 0, should be 0 or 1 in most cases.
155 (Fixed-form source only.) */
156 static unsigned long int ffelex_label_tokens_
;
158 /* Metering for token management, to catch token-memory leaks. */
159 static long int ffelex_total_tokens_
= 0;
160 static long int ffelex_old_total_tokens_
= 1;
161 static long int ffelex_token_nextid_
= 0;
163 /* Pertaining to lexing CHARACTER and HOLLERITH tokens. */
165 /* >0 if a Hollerith constant of that length might be in mid-lex, used
166 when the next character seen is 'H' or 'h' to enter HOLLERITH lexing
167 mode (see ffelex_raw_mode_). */
168 static long int ffelex_expecting_hollerith_
;
170 /* -3: Backslash (escape) sequence being lexed in CHARACTER.
171 -2: Possible closing apostrophe/quote seen in CHARACTER.
172 -1: Lexing CHARACTER.
173 0: Not lexing CHARACTER or HOLLERITH.
174 >0: Lexing HOLLERITH, value is # chars remaining to expect. */
175 static long int ffelex_raw_mode_
;
177 /* When lexing CHARACTER, open quote/apostrophe (either ' or "). */
178 static char ffelex_raw_char_
;
180 /* TRUE when backslash processing had to use most recent character
181 to finish its state engine, but that character is not part of
182 the backslash sequence, so must be reconsidered as a "normal"
183 character in CHARACTER/HOLLERITH lexing. */
184 static bool ffelex_backslash_reconsider_
= FALSE
;
186 /* Characters preread before lexing happened (might include EOF). */
187 static int *ffelex_kludge_chars_
= NULL
;
189 /* Doing the kludge processing, so not initialized yet. */
190 static bool ffelex_kludge_flag_
= FALSE
;
192 /* The beginning of a (possible) CHARACTER/HOLLERITH token. */
193 static ffewhereLine ffelex_raw_where_line_
;
194 static ffewhereColumn ffelex_raw_where_col_
;
197 /* Call this to append another character to the current token. If it isn't
198 currently big enough for it, it will be enlarged. The current token
199 must be a CHARACTER, HOLLERITH, NAME, NAMES, or NUMBER. */
202 ffelex_append_to_token_ (char c
)
204 if (ffelex_token_
->text
== NULL
)
207 = malloc_new_ksr (malloc_pool_image (), "FFELEX token text",
208 FFELEX_columnTOKEN_SIZE_
+ 1);
209 ffelex_token_
->size
= FFELEX_columnTOKEN_SIZE_
;
210 ffelex_token_
->length
= 0;
212 else if (ffelex_token_
->length
>= ffelex_token_
->size
)
215 = malloc_resize_ksr (malloc_pool_image (),
217 (ffelex_token_
->size
<< 1) + 1,
218 ffelex_token_
->size
+ 1);
219 ffelex_token_
->size
<<= 1;
220 assert (ffelex_token_
->length
< ffelex_token_
->size
);
222 ffelex_token_
->text
[ffelex_token_
->length
++] = c
;
225 /* Do backslash (escape) processing for a CHARACTER/HOLLERITH token
229 ffelex_backslash_ (int c
, ffewhereColumnNumber col
)
231 static int state
= 0;
232 static unsigned int count
;
234 static unsigned int firstdig
= 0;
236 static ffewhereLineNumber line
;
237 static ffewhereColumnNumber column
;
239 /* See gcc/c-lex.c readescape() for a straightforward version
240 of this state engine for handling backslashes in character/
241 hollerith constants. */
249 && (ffelex_raw_mode_
!= 0)
250 && ffe_is_backslash ())
254 line
= ffelex_linecount_current_
;
260 state
= 0; /* Assume simple case. */
270 case '0': case '1': case '2': case '3': case '4':
271 case '5': case '6': case '7':
277 case '\\': case '\'': case '"':
280 #if 0 /* Inappropriate for Fortran. */
282 ffelex_next_line_ ();
288 return TARGET_NEWLINE
;
320 /* xgettext:no-c-format */
321 ffebad_start_msg_lex ("Non-ISO-C-standard escape sequence `\\%A' at %0",
322 FFEBAD_severityPEDANTIC
);
323 ffelex_bad_here_ (0, line
, column
);
327 return (c
== 'E' || c
== 'e') ? 033 : c
;
333 if (c
>= 040 && c
< 0177)
339 /* xgettext:no-c-format */
340 ffebad_start_msg_lex ("Unknown escape sequence `\\%A' at %0",
341 FFEBAD_severityPEDANTIC
);
342 ffelex_bad_here_ (0, line
, column
);
348 /* xgettext:no-c-format */
349 ffebad_start_msg_lex ("Unterminated escape sequence `\\' at %0",
350 FFEBAD_severityPEDANTIC
);
351 ffelex_bad_here_ (0, line
, column
);
358 sprintf (&m
[0], "%x", c
);
359 /* xgettext:no-c-format */
360 ffebad_start_msg_lex ("Unknown escape sequence `\\' followed by char code 0x%A at %0",
361 FFEBAD_severityPEDANTIC
);
362 ffelex_bad_here_ (0, line
, column
);
372 code
= (code
* 16) + hex_value (c
);
373 if (code
!= 0 || count
!= 0)
387 /* xgettext:no-c-format */
388 ffebad_start_msg_lex ("\\x used at %0 with no following hex digits",
389 FFEBAD_severityFATAL
);
390 ffelex_bad_here_ (0, line
, column
);
394 /* Digits are all 0's. Ok. */
396 else if ((count
- 1) * 4 >= TYPE_PRECISION (integer_type_node
)
398 && ((1 << (TYPE_PRECISION (integer_type_node
) - (count
- 1) * 4))
401 /* xgettext:no-c-format */
402 ffebad_start_msg_lex ("Hex escape at %0 out of range",
403 FFEBAD_severityPEDANTIC
);
404 ffelex_bad_here_ (0, line
, column
);
410 if ((c
<= '7') && (c
>= '0') && (count
++ < 3))
412 code
= (code
* 8) + (c
- '0');
419 assert ("bad backslash state" == NULL
);
423 /* Come here when code has a built character, and c is the next
424 character that might (or might not) be the next one in the constant. */
426 /* Don't bother doing this check for each character going into
427 CHARACTER or HOLLERITH constants, just the escaped-value ones.
428 gcc apparently checks every single character, which seems
429 like it'd be kinda slow and not worth doing anyway. */
432 && TYPE_PRECISION (char_type_node
) < HOST_BITS_PER_INT
433 && code
>= (1 << TYPE_PRECISION (char_type_node
)))
435 /* xgettext:no-c-format */
436 ffebad_start_msg_lex ("Escape sequence at %0 out of range for character",
437 FFEBAD_severityFATAL
);
438 ffelex_bad_here_ (0, line
, column
);
444 /* Known end of constant, just append this character. */
445 ffelex_append_to_token_ (code
);
446 if (ffelex_raw_mode_
> 0)
451 /* Have two characters to handle. Do the first, then leave it to the
452 caller to detect anything special about the second. */
454 ffelex_append_to_token_ (code
);
455 if (ffelex_raw_mode_
> 0)
457 ffelex_backslash_reconsider_
= TRUE
;
461 /* ffelex_bad_1_ -- Issue diagnostic with one source point
463 ffelex_bad_1_(FFEBAD_SOME_ERROR,ffelex_linecount_current_,column + 1);
465 Creates ffewhere line and column objects for the source point, sends them
466 along with the error code to ffebad, then kills the line and column
467 objects before returning. */
470 ffelex_bad_1_ (ffebad errnum
, ffewhereLineNumber ln0
, ffewhereColumnNumber cn0
)
475 wl0
= ffewhere_line_new (ln0
);
476 wc0
= ffewhere_column_new (cn0
);
477 ffebad_start_lex (errnum
);
478 ffebad_here (0, wl0
, wc0
);
480 ffewhere_line_kill (wl0
);
481 ffewhere_column_kill (wc0
);
484 /* ffelex_bad_2_ -- Issue diagnostic with two source points
486 ffelex_bad_2_(FFEBAD_SOME_ERROR,ffelex_linecount_current_,column + 1,
487 otherline,othercolumn);
489 Creates ffewhere line and column objects for the source points, sends them
490 along with the error code to ffebad, then kills the line and column
491 objects before returning. */
494 ffelex_bad_2_ (ffebad errnum
, ffewhereLineNumber ln0
, ffewhereColumnNumber cn0
,
495 ffewhereLineNumber ln1
, ffewhereColumnNumber cn1
)
497 ffewhereLine wl0
, wl1
;
498 ffewhereColumn wc0
, wc1
;
500 wl0
= ffewhere_line_new (ln0
);
501 wc0
= ffewhere_column_new (cn0
);
502 wl1
= ffewhere_line_new (ln1
);
503 wc1
= ffewhere_column_new (cn1
);
504 ffebad_start_lex (errnum
);
505 ffebad_here (0, wl0
, wc0
);
506 ffebad_here (1, wl1
, wc1
);
508 ffewhere_line_kill (wl0
);
509 ffewhere_column_kill (wc0
);
510 ffewhere_line_kill (wl1
);
511 ffewhere_column_kill (wc1
);
515 ffelex_bad_here_ (int n
, ffewhereLineNumber ln0
,
516 ffewhereColumnNumber cn0
)
521 wl0
= ffewhere_line_new (ln0
);
522 wc0
= ffewhere_column_new (cn0
);
523 ffebad_here (n
, wl0
, wc0
);
524 ffewhere_line_kill (wl0
);
525 ffewhere_column_kill (wc0
);
529 ffelex_getc_ (FILE *finput
)
533 if (ffelex_kludge_chars_
== NULL
)
534 return getc (finput
);
536 c
= *ffelex_kludge_chars_
++;
540 ffelex_kludge_chars_
= NULL
;
541 return getc (finput
);
545 ffelex_cfebackslash_ (int *use_d
, int *d
, FILE *finput
)
547 register int c
= getc (finput
);
549 register unsigned count
;
550 unsigned firstdig
= 0;
570 code
= (code
* 16) + hex_value (c
);
571 if (code
!= 0 || count
!= 0)
580 error ("\\x used with no following hex digits");
582 /* Digits are all 0's. Ok. */
584 else if ((count
- 1) * 4 >= TYPE_PRECISION (integer_type_node
)
587 << (TYPE_PRECISION (integer_type_node
) - (count
- 1)
590 pedwarn ("hex escape out of range");
593 case '0': case '1': case '2': case '3': case '4':
594 case '5': case '6': case '7':
597 while ((c
<= '7') && (c
>= '0') && (count
++ < 3))
599 code
= (code
* 8) + (c
- '0');
606 case '\\': case '\'': case '"':
610 ffelex_next_line_ ();
620 return TARGET_NEWLINE
;
643 pedwarn ("non-ANSI-standard escape sequence, `\\%c'", c
);
649 /* `\(', etc, are used at beginning of line to avoid confusing Emacs. */
653 /* `\%' is used to prevent SCCS from getting confused. */
656 pedwarn ("non-ISO escape sequence `\\%c'", c
);
659 if (c
>= 040 && c
< 0177)
660 pedwarn ("unknown escape sequence `\\%c'", c
);
662 pedwarn ("unknown escape sequence: `\\' followed by char code 0x%x", c
);
666 /* A miniature version of the C front-end lexer. */
669 ffelex_cfelex_ (ffelexToken
*xtoken
, FILE *finput
, int c
)
676 register unsigned buffer_length
;
678 if ((*xtoken
!= NULL
) && !ffelex_kludge_flag_
)
679 ffelex_token_kill (*xtoken
);
683 case '0': case '1': case '2': case '3': case '4':
684 case '5': case '6': case '7': case '8': case '9':
685 buffer_length
= ARRAY_SIZE (buff
);
688 r
= &buff
[buffer_length
];
694 register unsigned bytes_used
= (p
- q
);
699 q
= xmalloc (buffer_length
);
700 memcpy (q
, buff
, bytes_used
);
703 q
= xrealloc (q
, buffer_length
);
705 r
= &q
[buffer_length
];
707 c
= ffelex_getc_ (finput
);
712 token
= ffelex_token_new_number (q
, ffewhere_line_unknown (),
713 ffewhere_column_unknown ());
721 buffer_length
= ARRAY_SIZE (buff
);
724 r
= &buff
[buffer_length
];
725 c
= ffelex_getc_ (finput
);
739 case '\\': /* ~~~~~ */
740 c
= ffelex_cfebackslash_ (&use_d
, &d
, finput
);
745 error ("badly formed directive -- no closing quote");
755 if (use_d
!= 2) /* 0=>c, 1=>cd, 2=>nil. */
760 register unsigned bytes_used
= (p
- q
);
762 buffer_length
= bytes_used
* 2;
765 q
= xmalloc (buffer_length
);
766 memcpy (q
, buff
, bytes_used
);
769 q
= xrealloc (q
, buffer_length
);
771 r
= &q
[buffer_length
];
780 token
= ffelex_token_new_character (q
, ffewhere_line_unknown (),
781 ffewhere_column_unknown ());
798 ffelex_file_pop_ (const char *filename
)
800 if (input_file_stack
->next
)
802 struct file_stack
*p
= input_file_stack
;
803 input_file_stack
= p
->next
;
805 input_file_stack_tick
++;
806 (*debug_hooks
->end_source_file
) (input_file_stack
->location
.line
);
809 error ("#-lines for entering and leaving files don't match");
811 /* Now that we've pushed or popped the input stack,
812 update the name in the top element. */
813 if (input_file_stack
)
814 input_file_stack
->location
.file
= filename
;
818 ffelex_file_push_ (int old_lineno
, const char *filename
)
820 struct file_stack
*p
= xmalloc (sizeof (struct file_stack
));
822 input_file_stack
->location
.line
= old_lineno
;
823 p
->next
= input_file_stack
;
824 p
->location
.file
= filename
;
825 input_file_stack
= p
;
826 input_file_stack_tick
++;
828 (*debug_hooks
->start_source_file
) (0, filename
);
830 /* Now that we've pushed or popped the input stack,
831 update the name in the top element. */
832 if (input_file_stack
)
833 input_file_stack
->location
.file
= filename
;
836 /* Prepare to finish a statement-in-progress by sending the current
837 token, if any, then setting up EOS as the current token with the
838 appropriate current pointer. The caller can then move the current
839 pointer before actually sending EOS, if desired, as it is in
840 typical fixed-form cases. */
843 ffelex_prepare_eos_ (void)
845 if (ffelex_token_
->type
!= FFELEX_typeNONE
)
847 ffelex_backslash_ (EOF
, 0);
849 switch (ffelex_raw_mode_
)
855 ffebad_start_lex ((ffelex_raw_char_
== '\'') ? FFEBAD_NO_CLOSING_APOSTROPHE
856 : FFEBAD_NO_CLOSING_QUOTE
);
857 ffebad_here (0, ffelex_token_
->where_line
, ffelex_token_
->where_col
);
858 ffebad_here (1, ffelex_current_wl_
, ffelex_current_wc_
);
869 ffebad_start_lex (FFEBAD_NOT_ENOUGH_HOLLERITH_CHARS
);
870 ffebad_here (0, ffelex_token_
->where_line
, ffelex_token_
->where_col
);
871 ffebad_here (1, ffelex_current_wl_
, ffelex_current_wc_
);
872 sprintf (num
, "%lu", (unsigned long) ffelex_raw_mode_
);
875 /* Make sure the token has some text, might as well fill up with spaces. */
878 ffelex_append_to_token_ (' ');
879 } while (--ffelex_raw_mode_
> 0);
883 ffelex_raw_mode_
= 0;
884 ffelex_send_token_ ();
886 ffelex_token_
->type
= FFELEX_typeEOS
;
887 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
888 ffelex_token_
->where_col
= ffewhere_column_use (ffelex_current_wc_
);
892 ffelex_finish_statement_ (void)
894 if ((ffelex_number_of_tokens_
== 0)
895 && (ffelex_token_
->type
== FFELEX_typeNONE
))
896 return; /* Don't have a statement pending. */
898 if (ffelex_token_
->type
!= FFELEX_typeEOS
)
899 ffelex_prepare_eos_ ();
901 ffelex_permit_include_
= TRUE
;
902 ffelex_send_token_ ();
903 ffelex_permit_include_
= FALSE
;
904 ffelex_number_of_tokens_
= 0;
905 ffelex_label_tokens_
= 0;
906 ffelex_names_
= TRUE
;
907 ffelex_names_pure_
= FALSE
; /* Probably not necessary. */
908 ffelex_hexnum_
= FALSE
;
910 if (!ffe_is_ffedebug ())
913 /* For debugging purposes only. */
915 if (ffelex_total_tokens_
!= ffelex_old_total_tokens_
)
917 fprintf (dmpout
, "; token_track had %ld tokens, now have %ld.\n",
918 ffelex_old_total_tokens_
, ffelex_total_tokens_
);
919 ffelex_old_total_tokens_
= ffelex_total_tokens_
;
923 /* Read a preprocessor directive line from file FINPUT. This function
924 returns either '\n' or EOF to indicate success or failure respectively.
925 Upon return, TEXT points to the contents of the line, which is stripped
926 of initial whitespace. The buffer pointed to by TEXT should not be
927 free'd and is overwritten by subsequent calls to this function. */
930 ffelex_get_directive_line_ (char **text
, FILE *finput
)
932 static char *directive_buffer
= NULL
;
933 static unsigned buffer_length
= 0;
935 register char *buffer_limit
;
936 register int looking_for
= 0;
937 register int char_escaped
= 0;
939 if (buffer_length
== 0)
941 directive_buffer
= xmalloc (128);
945 buffer_limit
= &directive_buffer
[buffer_length
];
947 for (p
= directive_buffer
; ; )
951 /* Make buffer bigger if it is full. */
952 if (p
>= buffer_limit
)
954 register unsigned bytes_used
= (p
- directive_buffer
);
957 directive_buffer
= xrealloc (directive_buffer
, buffer_length
);
958 p
= &directive_buffer
[bytes_used
];
959 buffer_limit
= &directive_buffer
[buffer_length
];
964 /* Discard initial whitespace. */
965 if ((c
== ' ' || c
== '\t') && p
== directive_buffer
)
968 /* Detect the end of the directive. */
969 if ((c
== '\n' && looking_for
== 0)
972 if (looking_for
!= 0)
973 error ("bad directive -- missing close-quote");
976 *text
= directive_buffer
;
982 ffelex_next_line_ ();
984 /* Handle string and character constant syntax. */
987 if (looking_for
== c
&& !char_escaped
)
988 looking_for
= 0; /* Found terminator... stop looking. */
991 if (c
== '\'' || c
== '"')
992 looking_for
= c
; /* Don't stop buffering until we see another
993 one of these (or an EOF). */
995 /* Handle backslash. */
996 char_escaped
= (c
== '\\' && ! char_escaped
);
1000 /* Handle # directives that make it through (or are generated by) the
1001 preprocessor. As much as reasonably possible, emulate the behavior
1002 of the gcc compiler phase cc1, though interactions between #include
1003 and INCLUDE might possibly produce bizarre results in terms of
1004 error reporting and the generation of debugging info vis-a-vis the
1005 locations of some things.
1007 Returns the next character unhandled, which is always newline or EOF. */
1010 ffelex_hash_ (FILE *finput
)
1013 ffelexToken token
= NULL
;
1015 /* Read first nonwhite char after the `#'. */
1017 c
= ffelex_getc_ (finput
);
1018 while (c
== ' ' || c
== '\t')
1019 c
= ffelex_getc_ (finput
);
1021 /* If a letter follows, then if the word here is `line', skip
1022 it and ignore it; otherwise, ignore the line, with an error
1023 if the word isn't `pragma', `ident', `define', or `undef'. */
1029 if (getc (finput
) == 'r'
1030 && getc (finput
) == 'a'
1031 && getc (finput
) == 'g'
1032 && getc (finput
) == 'm'
1033 && getc (finput
) == 'a'
1034 && ((c
= getc (finput
)) == ' ' || c
== '\t' || c
== '\n'
1042 if (getc (finput
) == 'e'
1043 && getc (finput
) == 'f'
1044 && getc (finput
) == 'i'
1045 && getc (finput
) == 'n'
1046 && getc (finput
) == 'e'
1047 && ((c
= getc (finput
)) == ' ' || c
== '\t' || c
== '\n'
1052 c
= ffelex_get_directive_line_ (&text
, finput
);
1054 if (debug_info_level
== DINFO_LEVEL_VERBOSE
)
1055 (*debug_hooks
->define
) (input_line
, text
);
1062 if (getc (finput
) == 'n'
1063 && getc (finput
) == 'd'
1064 && getc (finput
) == 'e'
1065 && getc (finput
) == 'f'
1066 && ((c
= getc (finput
)) == ' ' || c
== '\t' || c
== '\n'
1071 c
= ffelex_get_directive_line_ (&text
, finput
);
1073 if (debug_info_level
== DINFO_LEVEL_VERBOSE
)
1074 (*debug_hooks
->undef
) (input_line
, text
);
1081 if (getc (finput
) == 'i'
1082 && getc (finput
) == 'n'
1083 && getc (finput
) == 'e'
1084 && ((c
= getc (finput
)) == ' ' || c
== '\t'))
1089 if (getc (finput
) == 'd'
1090 && getc (finput
) == 'e'
1091 && getc (finput
) == 'n'
1092 && getc (finput
) == 't'
1093 && ((c
= getc (finput
)) == ' ' || c
== '\t'))
1095 /* #ident. The pedantic warning is now in cpp. */
1097 /* Here we have just seen `#ident '.
1098 A string constant should follow. */
1100 while (c
== ' ' || c
== '\t')
1103 /* If no argument, ignore the line. */
1104 if (c
== '\n' || c
== EOF
)
1107 c
= ffelex_cfelex_ (&token
, finput
, c
);
1110 || (ffelex_token_type (token
) != FFELEX_typeCHARACTER
))
1112 error ("invalid #ident");
1116 if (! flag_no_ident
)
1118 #ifdef ASM_OUTPUT_IDENT
1119 ASM_OUTPUT_IDENT (asm_out_file
,
1120 ffelex_token_text (token
));
1124 /* Skip the rest of this line. */
1129 error ("undefined or invalid # directive");
1134 /* Here we have either `#line' or `# <nonletter>'.
1135 In either case, it should be a line number; a digit should follow. */
1137 while (c
== ' ' || c
== '\t')
1138 c
= ffelex_getc_ (finput
);
1140 /* If the # is the only nonwhite char on the line,
1141 just ignore it. Check the new newline. */
1142 if (c
== '\n' || c
== EOF
)
1145 /* Something follows the #; read a token. */
1147 c
= ffelex_cfelex_ (&token
, finput
, c
);
1150 && (ffelex_token_type (token
) == FFELEX_typeNUMBER
))
1152 location_t old_loc
= input_location
;
1155 /* subtract one, because it is the following line that
1156 gets the specified number */
1157 int l
= atoi (ffelex_token_text (token
)) - 1;
1159 /* Is this the last nonwhite stuff on the line? */
1160 while (c
== ' ' || c
== '\t')
1161 c
= ffelex_getc_ (finput
);
1162 if (c
== '\n' || c
== EOF
)
1164 /* No more: store the line number and check following line. */
1166 if (!ffelex_kludge_flag_
)
1168 ffewhere_file_set (NULL
, TRUE
, (ffewhereLineNumber
) l
);
1171 ffelex_token_kill (token
);
1176 /* More follows: it must be a string constant (filename). */
1178 /* Read the string constant. */
1179 c
= ffelex_cfelex_ (&token
, finput
, c
);
1182 || (ffelex_token_type (token
) != FFELEX_typeCHARACTER
))
1184 error ("invalid #line");
1190 if (ffelex_kludge_flag_
)
1191 input_filename
= ggc_strdup (ffelex_token_text (token
));
1194 wf
= ffewhere_file_new (ffelex_token_text (token
),
1195 ffelex_token_length (token
));
1196 input_filename
= ffewhere_file_name (wf
);
1197 ffewhere_file_set (wf
, TRUE
, (ffewhereLineNumber
) l
);
1200 #if 0 /* Not sure what g77 should do with this yet. */
1201 /* Each change of file name
1202 reinitializes whether we are now in a system header. */
1203 in_system_header
= 0;
1206 if (main_input_filename
== 0)
1207 main_input_filename
= input_filename
;
1209 /* Is this the last nonwhite stuff on the line? */
1210 while (c
== ' ' || c
== '\t')
1212 if (c
== '\n' || c
== EOF
)
1214 if (!ffelex_kludge_flag_
)
1216 /* Update the name in the top element of input_file_stack. */
1217 if (input_file_stack
)
1218 input_file_stack
->location
.file
= input_filename
;
1221 ffelex_token_kill (token
);
1226 c
= ffelex_cfelex_ (&token
, finput
, c
);
1228 /* `1' after file name means entering new file.
1229 `2' after file name means just left a file. */
1232 && (ffelex_token_type (token
) == FFELEX_typeNUMBER
))
1234 int num
= atoi (ffelex_token_text (token
));
1236 if (ffelex_kludge_flag_
)
1239 input_filename
= old_loc
.file
;
1240 error ("use `#line ...' instead of `# ...' in first line");
1245 /* Pushing to a new file. */
1246 ffelex_file_push_ (old_loc
.line
, input_filename
);
1250 /* Popping out of a file. */
1251 ffelex_file_pop_ (input_filename
);
1254 /* Is this the last nonwhite stuff on the line? */
1255 while (c
== ' ' || c
== '\t')
1257 if (c
== '\n' || c
== EOF
)
1260 ffelex_token_kill (token
);
1264 c
= ffelex_cfelex_ (&token
, finput
, c
);
1267 /* `3' after file name means this is a system header file. */
1269 #if 0 /* Not sure what g77 should do with this yet. */
1271 && (ffelex_token_type (token
) == FFELEX_typeNUMBER
)
1272 && (atoi (ffelex_token_text (token
)) == 3))
1273 in_system_header
= 1;
1276 while (c
== ' ' || c
== '\t')
1278 if (((token
!= NULL
)
1279 || (c
!= '\n' && c
!= EOF
))
1280 && ffelex_kludge_flag_
)
1283 input_filename
= old_loc
.file
;
1284 error ("use `#line ...' instead of `# ...' in first line");
1286 if (c
== '\n' || c
== EOF
)
1288 if (token
!= NULL
&& !ffelex_kludge_flag_
)
1289 ffelex_token_kill (token
);
1294 error ("invalid #-line");
1296 /* skip the rest of this line. */
1298 if ((token
!= NULL
) && !ffelex_kludge_flag_
)
1299 ffelex_token_kill (token
);
1300 while ((c
= getc (finput
)) != EOF
&& c
!= '\n')
1305 /* "Image" a character onto the card image, return incremented column number.
1307 Normally invoking this function as in
1308 column = ffelex_image_char_ (c, column);
1309 is the same as doing:
1310 ffelex_card_image_[column++] = c;
1312 However, tabs and carriage returns are handled specially, to preserve
1313 the visual "image" of the input line (in most editors) in the card
1316 Carriage returns are ignored, as they are assumed to be followed
1319 A tab is handled by first doing:
1320 ffelex_card_image_[column++] = ' ';
1321 That is, it translates to at least one space. Then, as many spaces
1322 are imaged as necessary to bring the column number to the next tab
1323 position, where tab positions start in the ninth column and each
1324 eighth column afterwards. ALSO, a static var named ffelex_saw_tab_
1325 is set to TRUE to notify the lexer that a tab was seen.
1327 Columns are numbered and tab stops set as illustrated below:
1329 012345670123456701234567...
1333 xxxxxxx yyyyyyy zzzzzzz
1334 xxxxxxxx yyyyyyyy... */
1336 static ffewhereColumnNumber
1337 ffelex_image_char_ (int c
, ffewhereColumnNumber column
)
1339 ffewhereColumnNumber old_column
= column
;
1341 if (column
>= ffelex_card_size_
)
1343 ffewhereColumnNumber newmax
= ffelex_card_size_
<< 1;
1345 if (ffelex_bad_line_
)
1348 if ((newmax
>> 1) != ffelex_card_size_
)
1349 { /* Overflowed column number. */
1350 overflow
: /* :::::::::::::::::::: */
1352 ffelex_bad_line_
= TRUE
;
1353 strcpy (&ffelex_card_image_
[column
- 3], "...");
1354 ffelex_card_length_
= column
;
1355 ffelex_bad_1_ (FFEBAD_LINE_TOO_LONG
,
1356 ffelex_linecount_current_
, column
+ 1);
1361 = malloc_resize_ksr (malloc_pool_image (),
1364 ffelex_card_size_
+ 9);
1365 ffelex_card_size_
= newmax
;
1374 ffelex_saw_tab_
= TRUE
;
1375 ffelex_card_image_
[column
++] = ' ';
1376 while ((column
& 7) != 0)
1377 ffelex_card_image_
[column
++] = ' ';
1381 if (!ffelex_bad_line_
)
1383 ffelex_bad_line_
= TRUE
;
1384 strcpy (&ffelex_card_image_
[column
], "[\\0]");
1385 ffelex_card_length_
= column
+ 4;
1386 /* xgettext:no-c-format */
1387 ffebad_start_msg_lex ("Null character at %0 -- line ignored",
1388 FFEBAD_severityFATAL
);
1389 ffelex_bad_here_ (0, ffelex_linecount_current_
, column
+ 1);
1396 ffelex_card_image_
[column
++] = c
;
1400 if (column
< old_column
)
1402 column
= old_column
;
1403 goto overflow
; /* :::::::::::::::::::: */
1410 ffelex_include_ (void)
1412 ffewhereFile include_wherefile
= ffelex_include_wherefile_
;
1413 FILE *include_file
= ffelex_include_file_
;
1414 /* The rest of this is to push, and after the INCLUDE file is processed,
1415 pop, the static lexer state info that pertains to each particular
1418 ffewhereColumnNumber card_size
= ffelex_card_size_
;
1419 ffewhereColumnNumber card_length
= ffelex_card_length_
;
1420 ffewhereLine current_wl
= ffelex_current_wl_
;
1421 ffewhereColumn current_wc
= ffelex_current_wc_
;
1422 bool saw_tab
= ffelex_saw_tab_
;
1423 ffewhereColumnNumber final_nontab_column
= ffelex_final_nontab_column_
;
1424 ffewhereFile current_wf
= ffelex_current_wf_
;
1425 ffewhereLineNumber linecount_current
= ffelex_linecount_current_
;
1426 ffewhereLineNumber linecount_offset
1427 = ffewhere_line_filelinenum (current_wl
);
1428 location_t old_loc
= input_location
;
1430 if (card_length
!= 0)
1432 card_image
= malloc_new_ks (malloc_pool_image (),
1433 "FFELEX saved card image",
1435 memcpy (card_image
, ffelex_card_image_
, card_length
);
1440 ffelex_set_include_
= FALSE
;
1442 ffelex_next_line_ ();
1444 ffewhere_file_set (include_wherefile
, TRUE
, 0);
1446 ffelex_file_push_ (old_loc
.line
, ffewhere_file_name (include_wherefile
));
1448 if (ffelex_include_free_form_
)
1449 ffelex_file_free (include_wherefile
, include_file
);
1451 ffelex_file_fixed (include_wherefile
, include_file
);
1453 ffelex_file_pop_ (ffewhere_file_name (current_wf
));
1455 ffewhere_file_set (current_wf
, TRUE
, linecount_offset
);
1457 ffecom_close_include (include_file
);
1459 if (card_length
!= 0)
1461 assert (ffelex_card_size_
>= card_length
); /* It shrunk?? */
1462 memcpy (ffelex_card_image_
, card_image
, card_length
);
1464 ffelex_card_image_
[card_length
] = '\0';
1466 input_location
= old_loc
;
1467 ffelex_linecount_current_
= linecount_current
;
1468 ffelex_current_wf_
= current_wf
;
1469 ffelex_final_nontab_column_
= final_nontab_column
;
1470 ffelex_saw_tab_
= saw_tab
;
1471 ffelex_current_wc_
= current_wc
;
1472 ffelex_current_wl_
= current_wl
;
1473 ffelex_card_length_
= card_length
;
1474 ffelex_card_size_
= card_size
;
1477 /* ffelex_is_free_char_ctx_contin_ -- Character Context Continuation?
1479 ffewhereColumnNumber col;
1480 int c; // Char at col.
1481 if ((c == '&') && ffelex_is_free_char_ctx_contin_(col + 1))
1482 // We have a continuation indicator.
1484 If there are <n> spaces starting at ffelex_card_image_[col] up through
1485 the null character, where <n> is 0 or greater, returns TRUE. */
1488 ffelex_is_free_char_ctx_contin_ (ffewhereColumnNumber col
)
1490 while (ffelex_card_image_
[col
] != '\0')
1492 if (ffelex_card_image_
[col
++] != ' ')
1498 /* ffelex_is_free_nonc_ctx_contin_ -- Noncharacter Context Continuation?
1500 ffewhereColumnNumber col;
1501 int c; // Char at col.
1502 if ((c == '&') && ffelex_is_free_nonc_ctx_contin_(col + 1))
1503 // We have a continuation indicator.
1505 If there are <n> spaces starting at ffelex_card_image_[col] up through
1506 the null character or '!', where <n> is 0 or greater, returns TRUE. */
1509 ffelex_is_free_nonc_ctx_contin_ (ffewhereColumnNumber col
)
1511 while ((ffelex_card_image_
[col
] != '\0') && (ffelex_card_image_
[col
] != '!'))
1513 if (ffelex_card_image_
[col
++] != ' ')
1520 ffelex_next_line_ (void)
1522 ffelex_linecount_current_
= ffelex_linecount_next_
;
1523 ++ffelex_linecount_next_
;
1528 ffelex_send_token_ (void)
1530 ++ffelex_number_of_tokens_
;
1532 ffelex_backslash_ (EOF
, 0);
1534 if (ffelex_token_
->text
== NULL
)
1536 if (ffelex_token_
->type
== FFELEX_typeCHARACTER
)
1538 ffelex_append_to_token_ ('\0');
1539 ffelex_token_
->length
= 0;
1543 ffelex_token_
->text
[ffelex_token_
->length
] = '\0';
1545 assert (ffelex_raw_mode_
== 0);
1547 if (ffelex_token_
->type
== FFELEX_typeNAMES
)
1549 ffewhere_line_kill (ffelex_token_
->currentnames_line
);
1550 ffewhere_column_kill (ffelex_token_
->currentnames_col
);
1553 assert (ffelex_handler_
!= NULL
);
1554 ffelex_handler_
= (ffelexHandler
) (*ffelex_handler_
) (ffelex_token_
);
1555 assert (ffelex_handler_
!= NULL
);
1557 ffelex_token_kill (ffelex_token_
);
1559 ffelex_token_
= ffelex_token_new_ ();
1560 ffelex_token_
->uses
= 1;
1561 ffelex_token_
->text
= NULL
;
1562 if (ffelex_raw_mode_
< 0)
1564 ffelex_token_
->type
= FFELEX_typeCHARACTER
;
1565 ffelex_token_
->where_line
= ffelex_raw_where_line_
;
1566 ffelex_token_
->where_col
= ffelex_raw_where_col_
;
1567 ffelex_raw_where_line_
= ffewhere_line_unknown ();
1568 ffelex_raw_where_col_
= ffewhere_column_unknown ();
1572 ffelex_token_
->type
= FFELEX_typeNONE
;
1573 ffelex_token_
->where_line
= ffewhere_line_unknown ();
1574 ffelex_token_
->where_col
= ffewhere_column_unknown ();
1577 if (ffelex_set_include_
)
1581 /* ffelex_swallow_tokens_ -- Eat all tokens delivered to me
1583 return ffelex_swallow_tokens_;
1585 Return this handler when you don't want to look at any more tokens in the
1586 statement because you've encountered an unrecoverable error in the
1589 static ffelexHandler
1590 ffelex_swallow_tokens_ (ffelexToken t
)
1592 assert (ffelex_eos_handler_
!= NULL
);
1594 if ((ffelex_token_type (t
) == FFELEX_typeEOS
)
1595 || (ffelex_token_type (t
) == FFELEX_typeSEMICOLON
))
1596 return (ffelexHandler
) (*ffelex_eos_handler_
) (t
);
1598 return (ffelexHandler
) ffelex_swallow_tokens_
;
1602 ffelex_token_new_ (void)
1606 ++ffelex_total_tokens_
;
1608 t
= malloc_new_ks (malloc_pool_image (), "FFELEX token", sizeof (*t
));
1609 t
->id_
= ffelex_token_nextid_
++;
1614 ffelex_type_string_ (ffelexType type
)
1616 static const char *const types
[] = {
1618 "FFELEX_typeCOMMENT",
1624 "FFELEX_typeDOLLAR",
1626 "FFELEX_typePERCENT",
1627 "FFELEX_typeAMPERSAND",
1628 "FFELEX_typeAPOSTROPHE",
1629 "FFELEX_typeOPEN_PAREN",
1630 "FFELEX_typeCLOSE_PAREN",
1631 "FFELEX_typeASTERISK",
1634 "FFELEX_typePERIOD",
1636 "FFELEX_typeNUMBER",
1637 "FFELEX_typeOPEN_ANGLE",
1638 "FFELEX_typeEQUALS",
1639 "FFELEX_typeCLOSE_ANGLE",
1643 "FFELEX_typeCONCAT",
1646 "FFELEX_typeHOLLERITH",
1647 "FFELEX_typeCHARACTER",
1649 "FFELEX_typeSEMICOLON",
1650 "FFELEX_typeUNDERSCORE",
1651 "FFELEX_typeQUESTION",
1652 "FFELEX_typeOPEN_ARRAY",
1653 "FFELEX_typeCLOSE_ARRAY",
1654 "FFELEX_typeCOLONCOLON",
1655 "FFELEX_typeREL_LE",
1656 "FFELEX_typeREL_NE",
1657 "FFELEX_typeREL_EQ",
1658 "FFELEX_typePOINTS",
1662 if (type
>= ARRAY_SIZE (types
))
1668 ffelex_display_token (ffelexToken t
)
1673 fprintf (dmpout
, "; Token #%lu is %s (line %" ffewhereLineNumber_f
"u, col %"
1674 ffewhereColumnNumber_f
"u)",
1676 ffelex_type_string_ (t
->type
),
1677 ffewhere_line_number (t
->where_line
),
1678 ffewhere_column_number (t
->where_col
));
1680 if (t
->text
!= NULL
)
1681 fprintf (dmpout
, ": \"%.*s\"\n",
1685 fprintf (dmpout
, ".\n");
1688 /* ffelex_expecting_character -- Tells if next token expected to be CHARACTER
1690 if (ffelex_expecting_character())
1691 // next token delivered by lexer will be CHARACTER.
1693 If the most recent call to ffelex_set_expecting_hollerith since the last
1694 token was delivered by the lexer passed a length of -1, then we return
1695 TRUE, because the next token we deliver will be typeCHARACTER, else we
1699 ffelex_expecting_character (void)
1701 return (ffelex_raw_mode_
!= 0);
1704 /* ffelex_file_fixed -- Lex a given file in fixed source form
1708 ffelex_file_fixed(wf,f);
1710 Lexes the file according to Fortran 90 ANSI + VXT specifications. */
1713 ffelex_file_fixed (ffewhereFile wf
, FILE *f
)
1715 register int c
= 0; /* Character currently under consideration. */
1716 register ffewhereColumnNumber column
= 0; /* Not really; 0 means column 1... */
1717 bool disallow_continuation_line
;
1718 bool ignore_disallowed_continuation
= FALSE
;
1719 int latest_char_in_file
= 0; /* For getting back into comment-skipping
1722 ffewhereColumnNumber first_label_char
; /* First char of label --
1724 char label_string
[6]; /* Text of label. */
1725 int labi
; /* Length of label text. */
1726 bool finish_statement
; /* Previous statement finished? */
1727 bool have_content
; /* This line have content? */
1728 bool just_do_label
; /* Nothing but label (and continuation?) on
1731 /* Lex is called for a particular file, not for a particular program unit.
1732 Yet the two events do share common characteristics. The first line in a
1733 file or in a program unit cannot be a continuation line. No token can
1734 be in mid-formation. No current label for the statement exists, since
1735 there is no current statement. */
1737 assert (ffelex_handler_
!= NULL
);
1740 input_filename
= ffewhere_file_name (wf
);
1741 ffelex_current_wf_
= wf
;
1742 disallow_continuation_line
= TRUE
;
1743 ignore_disallowed_continuation
= FALSE
;
1744 ffelex_token_
->type
= FFELEX_typeNONE
;
1745 ffelex_number_of_tokens_
= 0;
1746 ffelex_label_tokens_
= 0;
1747 ffelex_current_wl_
= ffewhere_line_unknown ();
1748 ffelex_current_wc_
= ffewhere_column_unknown ();
1749 latest_char_in_file
= '\n';
1751 goto first_line
; /* :::::::::::::::::::: */
1753 /* Come here to get a new line. */
1755 beginning_of_line
: /* :::::::::::::::::::: */
1757 disallow_continuation_line
= FALSE
;
1759 /* Come here directly when last line didn't clarify the continuation issue. */
1761 beginning_of_line_again
: /* :::::::::::::::::::: */
1763 first_line
: /* :::::::::::::::::::: */
1765 c
= latest_char_in_file
;
1766 if ((c
== EOF
) || ((c
= ffelex_getc_ (f
)) == EOF
))
1769 end_of_file
: /* :::::::::::::::::::: */
1771 /* Line ending in EOF instead of \n still counts as a whole line. */
1773 ffelex_finish_statement_ ();
1774 ffewhere_line_kill (ffelex_current_wl_
);
1775 ffewhere_column_kill (ffelex_current_wc_
);
1776 return (ffelexHandler
) ffelex_handler_
;
1779 ffelex_next_line_ ();
1781 ffelex_bad_line_
= FALSE
;
1783 /* Skip over comment (and otherwise ignored) lines as quickly as possible! */
1785 while (((lextype
= ffelex_first_char_
[c
]) == FFELEX_typeCOMMENT
)
1786 || (lextype
== FFELEX_typeERROR
)
1787 || (lextype
== FFELEX_typeSLASH
)
1788 || (lextype
== FFELEX_typeHASH
))
1790 /* Test most frequent type of line first, etc. */
1791 if ((lextype
== FFELEX_typeCOMMENT
)
1792 || ((lextype
== FFELEX_typeSLASH
)
1793 && ((c
= getc (f
)) == '*'))) /* NOTE SIDE-EFFECT. */
1795 /* Typical case (straight comment), just ignore rest of line. */
1796 comment_line
: /* :::::::::::::::::::: */
1798 while ((c
!= '\n') && (c
!= EOF
))
1801 else if (lextype
== FFELEX_typeHASH
)
1802 c
= ffelex_hash_ (f
);
1803 else if (lextype
== FFELEX_typeSLASH
)
1805 /* SIDE-EFFECT ABOVE HAS HAPPENED. */
1806 ffelex_card_image_
[0] = '/';
1807 ffelex_card_image_
[1] = c
;
1809 goto bad_first_character
; /* :::::::::::::::::::: */
1812 /* typeERROR or unsupported typeHASH. */
1813 { /* Bad first character, get line and display
1815 column
= ffelex_image_char_ (c
, 0);
1817 bad_first_character
: /* :::::::::::::::::::: */
1819 ffelex_bad_line_
= TRUE
;
1820 while (((c
= getc (f
)) != '\n') && (c
!= EOF
))
1821 column
= ffelex_image_char_ (c
, column
);
1822 ffelex_card_image_
[column
] = '\0';
1823 ffelex_card_length_
= column
;
1824 ffelex_bad_1_ (FFEBAD_FIRST_CHAR_INVALID
,
1825 ffelex_linecount_current_
, 1);
1828 /* Read past last char in line. */
1832 ffelex_next_line_ ();
1833 goto end_of_file
; /* :::::::::::::::::::: */
1838 ffelex_next_line_ ();
1841 goto end_of_file
; /* :::::::::::::::::::: */
1843 ffelex_bad_line_
= FALSE
;
1844 } /* while [c, first char, means comment] */
1848 || (ffelex_final_nontab_column_
== 0);
1850 if (lextype
== FFELEX_typeDEBUG
)
1851 c
= ' '; /* A 'D' or 'd' in column 1 with the
1852 debug-lines option on. */
1854 column
= ffelex_image_char_ (c
, 0);
1856 /* Read the entire line in as is (with whitespace processing). */
1858 while (((c
= getc (f
)) != '\n') && (c
!= EOF
))
1859 column
= ffelex_image_char_ (c
, column
);
1861 if (ffelex_bad_line_
)
1863 ffelex_card_image_
[column
] = '\0';
1864 ffelex_card_length_
= column
;
1865 goto comment_line
; /* :::::::::::::::::::: */
1868 /* If no tab, cut off line after column 72/132. */
1870 if (!ffelex_saw_tab_
&& (column
> ffelex_final_nontab_column_
))
1872 /* Technically, we should now fill ffelex_card_image_ up thru column
1873 72/132 with spaces, since character/hollerith constants must count
1874 them in that manner. To save CPU time in several ways (avoid a loop
1875 here that would be used only when we actually end a line in
1876 character-constant mode; avoid writing memory unnecessarily; avoid a
1877 loop later checking spaces when not scanning for character-constant
1878 characters), we don't do this, and we do the appropriate thing when
1879 we encounter end-of-line while actually processing a character
1882 column
= ffelex_final_nontab_column_
;
1885 ffelex_card_image_
[column
] = '\0';
1886 ffelex_card_length_
= column
;
1888 /* Save next char in file so we can use register-based c while analyzing
1889 line we just read. */
1891 latest_char_in_file
= c
; /* Should be either '\n' or EOF. */
1893 have_content
= FALSE
;
1895 /* Handle label, if any. */
1898 first_label_char
= FFEWHERE_columnUNKNOWN
;
1899 for (column
= 0; column
< 5; ++column
)
1901 switch (c
= ffelex_card_image_
[column
])
1905 goto stop_looking
; /* :::::::::::::::::::: */
1920 label_string
[labi
++] = c
;
1921 if (first_label_char
== FFEWHERE_columnUNKNOWN
)
1922 first_label_char
= column
+ 1;
1928 ffelex_bad_1_ (FFEBAD_LABEL_FIELD_NOT_NUMERIC
,
1929 ffelex_linecount_current_
,
1931 goto beginning_of_line_again
; /* :::::::::::::::::::: */
1933 if (ffe_is_pedantic ())
1934 ffelex_bad_1_ (FFEBAD_AMPERSAND
,
1935 ffelex_linecount_current_
, 1);
1936 finish_statement
= FALSE
;
1937 just_do_label
= FALSE
;
1938 goto got_a_continuation
; /* :::::::::::::::::::: */
1941 if (ffelex_card_image_
[column
+ 1] == '*')
1942 goto stop_looking
; /* :::::::::::::::::::: */
1945 ffelex_bad_1_ (FFEBAD_LABEL_FIELD_NOT_NUMERIC
,
1946 ffelex_linecount_current_
, column
+ 1);
1947 goto beginning_of_line_again
; /* :::::::::::::::::::: */
1951 stop_looking
: /* :::::::::::::::::::: */
1953 label_string
[labi
] = '\0';
1955 /* Find first nonblank char starting with continuation column. */
1957 if (column
== 5) /* In which case we didn't see end of line in
1959 while ((c
= ffelex_card_image_
[column
]) == ' ')
1962 /* Now we're trying to figure out whether this is a continuation line and
1963 whether there's anything else of substance on the line. The cases are
1966 1. If a line has an explicit continuation character (other than the digit
1967 zero), then if it also has a label, the label is ignored and an error
1968 message is printed. Any remaining text on the line is passed to the
1969 parser tasks, thus even an all-blank line (possibly with an ignored
1970 label) aside from a positive continuation character might have meaning
1971 in the midst of a character or hollerith constant.
1973 2. If a line has no explicit continuation character (that is, it has a
1974 space in column 6 and the first non-space character past column 6 is
1975 not a digit 0-9), then there are two possibilities:
1977 A. A label is present and/or a non-space (and non-comment) character
1978 appears somewhere after column 6. Terminate processing of the previous
1979 statement, if any, send the new label for the next statement, if any,
1980 and start processing a new statement with this non-blank character, if
1983 B. The line is essentially blank, except for a possible comment character.
1984 Don't terminate processing of the previous statement and don't pass any
1985 characters to the parser tasks, since the line is not flagged as a
1986 continuation line. We treat it just like a completely blank line.
1988 3. If a line has a continuation character of zero (0), then we terminate
1989 processing of the previous statement, if any, send the new label for the
1990 next statement, if any, and start processing a new statement, if any
1991 non-blank characters are present.
1993 If, when checking to see if we should terminate the previous statement, it
1994 is found that there is no previous statement but that there is an
1995 outstanding label, substitute CONTINUE as the statement for the label
1996 and display an error message. */
1998 finish_statement
= FALSE
;
1999 just_do_label
= FALSE
;
2003 case '!': /* ANSI Fortran 90 says ! in column 6 is
2005 /* VXT Fortran says ! anywhere is comment, even column 6. */
2006 if (ffe_is_vxt () || (column
!= 5))
2007 goto no_tokens_on_line
; /* :::::::::::::::::::: */
2008 goto got_a_continuation
; /* :::::::::::::::::::: */
2011 if (ffelex_card_image_
[column
+ 1] != '*')
2012 goto some_other_character
; /* :::::::::::::::::::: */
2016 /* This seems right to do. But it is close to call, since / * starting
2017 in column 6 will thus be interpreted as a continuation line
2018 beginning with '*'. */
2020 goto got_a_continuation
;/* :::::::::::::::::::: */
2024 /* End of line. Therefore may be continued-through line, so handle
2025 pending label as possible to-be-continued and drive end-of-statement
2026 for any previous statement, else treat as blank line. */
2028 no_tokens_on_line
: /* :::::::::::::::::::: */
2030 if (ffe_is_pedantic () && (c
== '/'))
2031 ffelex_bad_1_ (FFEBAD_NON_ANSI_COMMENT
,
2032 ffelex_linecount_current_
, column
+ 1);
2033 if (first_label_char
!= FFEWHERE_columnUNKNOWN
)
2034 { /* Can't be a continued-through line if it
2036 finish_statement
= TRUE
;
2037 have_content
= TRUE
;
2038 just_do_label
= TRUE
;
2041 goto beginning_of_line_again
; /* :::::::::::::::::::: */
2044 if (ffe_is_pedantic () && (column
!= 5))
2045 ffelex_bad_1_ (FFEBAD_NON_ANSI_CONTINUATION_COLUMN
,
2046 ffelex_linecount_current_
, column
+ 1);
2047 finish_statement
= TRUE
;
2048 goto check_for_content
; /* :::::::::::::::::::: */
2060 /* NOTE: This label can be reached directly from the code
2061 that lexes the label field in columns 1-5. */
2062 got_a_continuation
: /* :::::::::::::::::::: */
2064 if (first_label_char
!= FFEWHERE_columnUNKNOWN
)
2066 ffelex_bad_2_ (FFEBAD_LABEL_ON_CONTINUATION
,
2067 ffelex_linecount_current_
,
2069 ffelex_linecount_current_
,
2071 first_label_char
= FFEWHERE_columnUNKNOWN
;
2073 if (disallow_continuation_line
)
2075 if (!ignore_disallowed_continuation
)
2076 ffelex_bad_1_ (FFEBAD_INVALID_CONTINUATION
,
2077 ffelex_linecount_current_
, column
+ 1);
2078 goto beginning_of_line_again
; /* :::::::::::::::::::: */
2080 if (ffe_is_pedantic () && (column
!= 5))
2081 ffelex_bad_1_ (FFEBAD_NON_ANSI_CONTINUATION_COLUMN
,
2082 ffelex_linecount_current_
, column
+ 1);
2083 if ((ffelex_raw_mode_
!= 0)
2084 && (((c
= ffelex_card_image_
[column
+ 1]) != '\0')
2085 || !ffelex_saw_tab_
))
2088 have_content
= TRUE
;
2092 check_for_content
: /* :::::::::::::::::::: */
2094 while ((c
= ffelex_card_image_
[++column
]) == ' ')
2099 && (ffelex_card_image_
[column
+ 1] == '*')))
2101 if (ffe_is_pedantic () && (c
== '/'))
2102 ffelex_bad_1_ (FFEBAD_NON_ANSI_COMMENT
,
2103 ffelex_linecount_current_
, column
+ 1);
2104 just_do_label
= TRUE
;
2107 have_content
= TRUE
;
2112 some_other_character
: /* :::::::::::::::::::: */
2115 goto got_a_continuation
;/* :::::::::::::::::::: */
2117 /* Here is the very normal case of a regular character starting in
2118 column 7 or beyond with a blank in column 6. */
2120 finish_statement
= TRUE
;
2121 have_content
= TRUE
;
2126 || (first_label_char
!= FFEWHERE_columnUNKNOWN
))
2128 /* The line has content of some kind, install new end-statement
2129 point for error messages. Note that "content" includes cases
2130 where there's little apparent content but enough to finish
2131 a statement. That's because finishing a statement can trigger
2132 an impending INCLUDE, and that requires accurate line info being
2133 maintained by the lexer. */
2135 if (finish_statement
)
2136 ffelex_prepare_eos_ (); /* Prepare EOS before we move current pointer. */
2138 ffewhere_line_kill (ffelex_current_wl_
);
2139 ffewhere_column_kill (ffelex_current_wc_
);
2140 ffelex_current_wl_
= ffewhere_line_new (ffelex_linecount_current_
);
2141 ffelex_current_wc_
= ffewhere_column_new (ffelex_card_length_
+ 1);
2144 /* We delay this for a combination of reasons. Mainly, it can start
2145 INCLUDE processing, and we want to delay that until the lexer's
2146 info on the line is coherent. And we want to delay that until we're
2147 sure there's a reason to make that info coherent, to avoid saving
2148 lots of useless lines. */
2150 if (finish_statement
)
2151 ffelex_finish_statement_ ();
2153 /* If label is present, enclose it in a NUMBER token and send it along. */
2155 if (first_label_char
!= FFEWHERE_columnUNKNOWN
)
2157 assert (ffelex_token_
->type
== FFELEX_typeNONE
);
2158 ffelex_token_
->type
= FFELEX_typeNUMBER
;
2159 ffelex_append_to_token_ ('\0'); /* Make room for label text. */
2160 strcpy (ffelex_token_
->text
, label_string
);
2161 ffelex_token_
->where_line
2162 = ffewhere_line_use (ffelex_current_wl_
);
2163 ffelex_token_
->where_col
= ffewhere_column_new (first_label_char
);
2164 ffelex_token_
->length
= labi
;
2165 ffelex_send_token_ ();
2166 ++ffelex_label_tokens_
;
2170 goto beginning_of_line
; /* :::::::::::::::::::: */
2172 /* Here is the main engine for parsing. c holds the character at column.
2173 It is already known that c is not a blank, end of line, or shriek,
2174 unless ffelex_raw_mode_ is not 0 (indicating we are in a
2175 character/hollerith constant). A partially filled token may already
2176 exist in ffelex_token_. One special case: if, when the end of the line
2177 is reached, continuation_line is FALSE and the only token on the line is
2178 END, then it is indeed the last statement. We don't look for
2179 continuation lines during this program unit in that case. This is
2180 according to ANSI. */
2182 if (ffelex_raw_mode_
!= 0)
2185 parse_raw_character
: /* :::::::::::::::::::: */
2189 ffewhereColumnNumber i
;
2191 if (ffelex_saw_tab_
|| (column
>= ffelex_final_nontab_column_
))
2192 goto beginning_of_line
; /* :::::::::::::::::::: */
2194 /* Pad out line with "virtual" spaces. */
2196 for (i
= column
; i
< ffelex_final_nontab_column_
; ++i
)
2197 ffelex_card_image_
[i
] = ' ';
2198 ffelex_card_image_
[i
] = '\0';
2199 ffelex_card_length_
= i
;
2203 switch (ffelex_raw_mode_
)
2206 c
= ffelex_backslash_ (c
, column
);
2210 if (!ffelex_backslash_reconsider_
)
2211 ffelex_append_to_token_ (c
);
2212 ffelex_raw_mode_
= -1;
2216 if (c
== ffelex_raw_char_
)
2218 ffelex_raw_mode_
= -1;
2219 ffelex_append_to_token_ (c
);
2223 ffelex_raw_mode_
= 0;
2224 ffelex_backslash_reconsider_
= TRUE
;
2229 if (c
== ffelex_raw_char_
)
2230 ffelex_raw_mode_
= -2;
2233 c
= ffelex_backslash_ (c
, column
);
2236 ffelex_raw_mode_
= -3;
2240 ffelex_append_to_token_ (c
);
2245 c
= ffelex_backslash_ (c
, column
);
2249 if (!ffelex_backslash_reconsider_
)
2251 ffelex_append_to_token_ (c
);
2257 if (ffelex_backslash_reconsider_
)
2258 ffelex_backslash_reconsider_
= FALSE
;
2260 c
= ffelex_card_image_
[++column
];
2262 if (ffelex_raw_mode_
== 0)
2264 ffelex_send_token_ ();
2265 assert (ffelex_raw_mode_
== 0);
2267 c
= ffelex_card_image_
[++column
];
2271 && (ffelex_card_image_
[column
+ 1] == '*')))
2272 goto beginning_of_line
; /* :::::::::::::::::::: */
2273 goto parse_nonraw_character
; /* :::::::::::::::::::: */
2275 goto parse_raw_character
; /* :::::::::::::::::::: */
2278 parse_nonraw_character
: /* :::::::::::::::::::: */
2280 switch (ffelex_token_
->type
)
2282 case FFELEX_typeNONE
:
2286 ffelex_token_
->type
= FFELEX_typeQUOTE
;
2287 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
2288 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
2289 ffelex_send_token_ ();
2293 ffelex_token_
->type
= FFELEX_typeDOLLAR
;
2294 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
2295 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
2296 ffelex_send_token_ ();
2300 ffelex_token_
->type
= FFELEX_typePERCENT
;
2301 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
2302 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
2303 ffelex_send_token_ ();
2307 ffelex_token_
->type
= FFELEX_typeAMPERSAND
;
2308 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
2309 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
2310 ffelex_send_token_ ();
2314 ffelex_token_
->type
= FFELEX_typeAPOSTROPHE
;
2315 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
2316 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
2317 ffelex_send_token_ ();
2321 ffelex_token_
->type
= FFELEX_typeOPEN_PAREN
;
2322 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
2323 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
2327 ffelex_token_
->type
= FFELEX_typeCLOSE_PAREN
;
2328 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
2329 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
2330 ffelex_send_token_ ();
2334 ffelex_token_
->type
= FFELEX_typeASTERISK
;
2335 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
2336 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
2340 ffelex_token_
->type
= FFELEX_typePLUS
;
2341 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
2342 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
2343 ffelex_send_token_ ();
2347 ffelex_token_
->type
= FFELEX_typeCOMMA
;
2348 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
2349 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
2350 ffelex_send_token_ ();
2354 ffelex_token_
->type
= FFELEX_typeMINUS
;
2355 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
2356 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
2357 ffelex_send_token_ ();
2361 ffelex_token_
->type
= FFELEX_typePERIOD
;
2362 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
2363 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
2364 ffelex_send_token_ ();
2368 ffelex_token_
->type
= FFELEX_typeSLASH
;
2369 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
2370 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
2384 = ffelex_hexnum_
? FFELEX_typeNAME
: FFELEX_typeNUMBER
;
2385 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
2386 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
2387 ffelex_append_to_token_ (c
);
2391 ffelex_token_
->type
= FFELEX_typeCOLON
;
2392 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
2393 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
2397 ffelex_token_
->type
= FFELEX_typeSEMICOLON
;
2398 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
2399 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
2400 ffelex_permit_include_
= TRUE
;
2401 ffelex_send_token_ ();
2402 ffelex_permit_include_
= FALSE
;
2406 ffelex_token_
->type
= FFELEX_typeOPEN_ANGLE
;
2407 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
2408 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
2412 ffelex_token_
->type
= FFELEX_typeEQUALS
;
2413 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
2414 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
2418 ffelex_token_
->type
= FFELEX_typeCLOSE_ANGLE
;
2419 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
2420 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
2424 ffelex_token_
->type
= FFELEX_typeQUESTION
;
2425 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
2426 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
2427 ffelex_send_token_ ();
2431 if (1 || ffe_is_90 ())
2433 ffelex_token_
->type
= FFELEX_typeUNDERSCORE
;
2434 ffelex_token_
->where_line
2435 = ffewhere_line_use (ffelex_current_wl_
);
2436 ffelex_token_
->where_col
2437 = ffewhere_column_new (column
+ 1);
2438 ffelex_send_token_ ();
2494 c
= ffesrc_char_source (c
);
2496 if (ffesrc_char_match_init (c
, 'H', 'h')
2497 && ffelex_expecting_hollerith_
!= 0)
2499 ffelex_raw_mode_
= ffelex_expecting_hollerith_
;
2500 ffelex_token_
->type
= FFELEX_typeHOLLERITH
;
2501 ffelex_token_
->where_line
= ffelex_raw_where_line_
;
2502 ffelex_token_
->where_col
= ffelex_raw_where_col_
;
2503 ffelex_raw_where_line_
= ffewhere_line_unknown ();
2504 ffelex_raw_where_col_
= ffewhere_column_unknown ();
2505 c
= ffelex_card_image_
[++column
];
2506 goto parse_raw_character
; /* :::::::::::::::::::: */
2511 ffelex_token_
->where_line
2512 = ffewhere_line_use (ffelex_token_
->currentnames_line
2513 = ffewhere_line_use (ffelex_current_wl_
));
2514 ffelex_token_
->where_col
2515 = ffewhere_column_use (ffelex_token_
->currentnames_col
2516 = ffewhere_column_new (column
+ 1));
2517 ffelex_token_
->type
= FFELEX_typeNAMES
;
2521 ffelex_token_
->where_line
2522 = ffewhere_line_use (ffelex_current_wl_
);
2523 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
2524 ffelex_token_
->type
= FFELEX_typeNAME
;
2526 ffelex_append_to_token_ (c
);
2530 ffelex_bad_1_ (FFEBAD_UNRECOGNIZED_CHARACTER
,
2531 ffelex_linecount_current_
, column
+ 1);
2532 ffelex_finish_statement_ ();
2533 disallow_continuation_line
= TRUE
;
2534 ignore_disallowed_continuation
= TRUE
;
2535 goto beginning_of_line_again
; /* :::::::::::::::::::: */
2539 case FFELEX_typeNAME
:
2594 c
= ffesrc_char_source (c
);
2609 && !ffe_is_dollar_ok ())
2611 ffelex_send_token_ ();
2612 goto parse_next_character
; /* :::::::::::::::::::: */
2614 ffelex_append_to_token_ (c
);
2618 ffelex_send_token_ ();
2619 goto parse_next_character
; /* :::::::::::::::::::: */
2623 case FFELEX_typeNAMES
:
2678 c
= ffesrc_char_source (c
);
2693 && !ffe_is_dollar_ok ())
2695 ffelex_send_token_ ();
2696 goto parse_next_character
; /* :::::::::::::::::::: */
2698 if (ffelex_token_
->length
< FFEWHERE_indexMAX
)
2700 ffewhere_track (&ffelex_token_
->currentnames_line
,
2701 &ffelex_token_
->currentnames_col
,
2702 ffelex_token_
->wheretrack
,
2703 ffelex_token_
->length
,
2704 ffelex_linecount_current_
,
2707 ffelex_append_to_token_ (c
);
2711 ffelex_send_token_ ();
2712 goto parse_next_character
; /* :::::::::::::::::::: */
2716 case FFELEX_typeNUMBER
:
2729 ffelex_append_to_token_ (c
);
2733 ffelex_send_token_ ();
2734 goto parse_next_character
; /* :::::::::::::::::::: */
2738 case FFELEX_typeASTERISK
:
2742 ffelex_token_
->type
= FFELEX_typePOWER
;
2743 ffelex_send_token_ ();
2746 default: /* * not followed by another *. */
2747 ffelex_send_token_ ();
2748 goto parse_next_character
; /* :::::::::::::::::::: */
2752 case FFELEX_typeCOLON
:
2756 ffelex_token_
->type
= FFELEX_typeCOLONCOLON
;
2757 ffelex_send_token_ ();
2760 default: /* : not followed by another :. */
2761 ffelex_send_token_ ();
2762 goto parse_next_character
; /* :::::::::::::::::::: */
2766 case FFELEX_typeSLASH
:
2770 ffelex_token_
->type
= FFELEX_typeCONCAT
;
2771 ffelex_send_token_ ();
2775 ffelex_token_
->type
= FFELEX_typeCLOSE_ARRAY
;
2776 ffelex_send_token_ ();
2780 ffelex_token_
->type
= FFELEX_typeREL_NE
;
2781 ffelex_send_token_ ();
2785 ffelex_send_token_ ();
2786 goto parse_next_character
; /* :::::::::::::::::::: */
2790 case FFELEX_typeOPEN_PAREN
:
2794 ffelex_token_
->type
= FFELEX_typeOPEN_ARRAY
;
2795 ffelex_send_token_ ();
2799 ffelex_send_token_ ();
2800 goto parse_next_character
; /* :::::::::::::::::::: */
2804 case FFELEX_typeOPEN_ANGLE
:
2808 ffelex_token_
->type
= FFELEX_typeREL_LE
;
2809 ffelex_send_token_ ();
2813 ffelex_send_token_ ();
2814 goto parse_next_character
; /* :::::::::::::::::::: */
2818 case FFELEX_typeEQUALS
:
2822 ffelex_token_
->type
= FFELEX_typeREL_EQ
;
2823 ffelex_send_token_ ();
2827 ffelex_token_
->type
= FFELEX_typePOINTS
;
2828 ffelex_send_token_ ();
2832 ffelex_send_token_ ();
2833 goto parse_next_character
; /* :::::::::::::::::::: */
2837 case FFELEX_typeCLOSE_ANGLE
:
2841 ffelex_token_
->type
= FFELEX_typeREL_GE
;
2842 ffelex_send_token_ ();
2846 ffelex_send_token_ ();
2847 goto parse_next_character
; /* :::::::::::::::::::: */
2852 assert ("Serious error!!" == NULL
);
2857 c
= ffelex_card_image_
[++column
];
2859 parse_next_character
: /* :::::::::::::::::::: */
2861 if (ffelex_raw_mode_
!= 0)
2862 goto parse_raw_character
; /* :::::::::::::::::::: */
2865 c
= ffelex_card_image_
[++column
];
2870 && (ffelex_card_image_
[column
+ 1] == '*')))
2872 if ((ffelex_number_of_tokens_
== ffelex_label_tokens_
)
2873 && (ffelex_token_
->type
== FFELEX_typeNAMES
)
2874 && (ffelex_token_
->length
== 3)
2875 && (ffesrc_strncmp_2c (ffe_case_match (),
2876 ffelex_token_
->text
,
2877 "END", "end", "End",
2881 ffelex_finish_statement_ ();
2882 disallow_continuation_line
= TRUE
;
2883 ignore_disallowed_continuation
= FALSE
;
2884 goto beginning_of_line_again
; /* :::::::::::::::::::: */
2886 goto beginning_of_line
; /* :::::::::::::::::::: */
2888 goto parse_nonraw_character
; /* :::::::::::::::::::: */
2891 /* ffelex_file_free -- Lex a given file in free source form
2895 ffelex_file_free(wf,f);
2897 Lexes the file according to Fortran 90 ANSI + VXT specifications. */
2900 ffelex_file_free (ffewhereFile wf
, FILE *f
)
2902 register int c
= 0; /* Character currently under consideration. */
2903 register ffewhereColumnNumber column
= 0; /* Not really; 0 means column 1... */
2904 bool continuation_line
= FALSE
;
2905 ffewhereColumnNumber continuation_column
;
2906 int latest_char_in_file
= 0; /* For getting back into comment-skipping
2909 /* Lex is called for a particular file, not for a particular program unit.
2910 Yet the two events do share common characteristics. The first line in a
2911 file or in a program unit cannot be a continuation line. No token can
2912 be in mid-formation. No current label for the statement exists, since
2913 there is no current statement. */
2915 assert (ffelex_handler_
!= NULL
);
2918 input_filename
= ffewhere_file_name (wf
);
2919 ffelex_current_wf_
= wf
;
2920 continuation_line
= FALSE
;
2921 ffelex_token_
->type
= FFELEX_typeNONE
;
2922 ffelex_number_of_tokens_
= 0;
2923 ffelex_current_wl_
= ffewhere_line_unknown ();
2924 ffelex_current_wc_
= ffewhere_column_unknown ();
2925 latest_char_in_file
= '\n';
2927 /* Come here to get a new line. */
2929 beginning_of_line
: /* :::::::::::::::::::: */
2931 c
= latest_char_in_file
;
2932 if ((c
== EOF
) || ((c
= ffelex_getc_ (f
)) == EOF
))
2935 end_of_file
: /* :::::::::::::::::::: */
2937 /* Line ending in EOF instead of \n still counts as a whole line. */
2939 ffelex_finish_statement_ ();
2940 ffewhere_line_kill (ffelex_current_wl_
);
2941 ffewhere_column_kill (ffelex_current_wc_
);
2942 return (ffelexHandler
) ffelex_handler_
;
2945 ffelex_next_line_ ();
2947 ffelex_bad_line_
= FALSE
;
2949 /* Skip over initial-comment and empty lines as quickly as possible! */
2956 c
= ffelex_hash_ (f
);
2958 comment_line
: /* :::::::::::::::::::: */
2960 while ((c
!= '\n') && (c
!= EOF
))
2965 ffelex_next_line_ ();
2966 goto end_of_file
; /* :::::::::::::::::::: */
2971 ffelex_next_line_ ();
2974 goto end_of_file
; /* :::::::::::::::::::: */
2977 ffelex_saw_tab_
= FALSE
;
2979 column
= ffelex_image_char_ (c
, 0);
2981 /* Read the entire line in as is (with whitespace processing). */
2983 while (((c
= getc (f
)) != '\n') && (c
!= EOF
))
2984 column
= ffelex_image_char_ (c
, column
);
2986 if (ffelex_bad_line_
)
2988 ffelex_card_image_
[column
] = '\0';
2989 ffelex_card_length_
= column
;
2990 goto comment_line
; /* :::::::::::::::::::: */
2993 /* If no tab, cut off line after column 132. */
2995 if (!ffelex_saw_tab_
&& (column
> FFELEX_FREE_MAX_COLUMNS_
))
2996 column
= FFELEX_FREE_MAX_COLUMNS_
;
2998 ffelex_card_image_
[column
] = '\0';
2999 ffelex_card_length_
= column
;
3001 /* Save next char in file so we can use register-based c while analyzing
3002 line we just read. */
3004 latest_char_in_file
= c
; /* Should be either '\n' or EOF. */
3007 continuation_column
= 0;
3009 /* Skip over initial spaces to see if the first nonblank character
3010 is exclamation point, newline, or EOF (line is therefore a comment) or
3011 ampersand (line is therefore a continuation line). */
3013 while ((c
= ffelex_card_image_
[column
]) == ' ')
3020 goto beginning_of_line
; /* :::::::::::::::::::: */
3023 continuation_column
= column
+ 1;
3030 /* The line definitely has content of some kind, install new end-statement
3031 point for error messages. */
3033 ffewhere_line_kill (ffelex_current_wl_
);
3034 ffewhere_column_kill (ffelex_current_wc_
);
3035 ffelex_current_wl_
= ffewhere_line_new (ffelex_linecount_current_
);
3036 ffelex_current_wc_
= ffewhere_column_new (ffelex_card_length_
+ 1);
3038 /* Figure out which column to start parsing at. */
3040 if (continuation_line
)
3042 if (continuation_column
== 0)
3044 if (ffelex_raw_mode_
!= 0)
3046 ffelex_bad_1_ (FFEBAD_BAD_CHAR_CONTINUE
,
3047 ffelex_linecount_current_
, column
+ 1);
3049 else if (ffelex_token_
->type
!= FFELEX_typeNONE
)
3051 ffelex_bad_1_ (FFEBAD_BAD_LEXTOK_CONTINUE
,
3052 ffelex_linecount_current_
, column
+ 1);
3055 else if (ffelex_is_free_char_ctx_contin_ (continuation_column
))
3056 { /* Line contains only a single "&" as only
3057 nonblank character. */
3058 ffelex_bad_1_ (FFEBAD_BAD_FREE_CONTINUE
,
3059 ffelex_linecount_current_
, continuation_column
);
3060 goto beginning_of_line
; /* :::::::::::::::::::: */
3062 column
= continuation_column
;
3067 c
= ffelex_card_image_
[column
];
3068 continuation_line
= FALSE
;
3070 /* Here is the main engine for parsing. c holds the character at column.
3071 It is already known that c is not a blank, end of line, or shriek,
3072 unless ffelex_raw_mode_ is not 0 (indicating we are in a
3073 character/hollerith constant). A partially filled token may already
3074 exist in ffelex_token_. */
3076 if (ffelex_raw_mode_
!= 0)
3079 parse_raw_character
: /* :::::::::::::::::::: */
3084 if (ffelex_is_free_char_ctx_contin_ (column
+ 1))
3086 continuation_line
= TRUE
;
3087 goto beginning_of_line
; /* :::::::::::::::::::: */
3092 ffelex_finish_statement_ ();
3093 goto beginning_of_line
; /* :::::::::::::::::::: */
3099 switch (ffelex_raw_mode_
)
3102 c
= ffelex_backslash_ (c
, column
);
3106 if (!ffelex_backslash_reconsider_
)
3107 ffelex_append_to_token_ (c
);
3108 ffelex_raw_mode_
= -1;
3112 if (c
== ffelex_raw_char_
)
3114 ffelex_raw_mode_
= -1;
3115 ffelex_append_to_token_ (c
);
3119 ffelex_raw_mode_
= 0;
3120 ffelex_backslash_reconsider_
= TRUE
;
3125 if (c
== ffelex_raw_char_
)
3126 ffelex_raw_mode_
= -2;
3129 c
= ffelex_backslash_ (c
, column
);
3132 ffelex_raw_mode_
= -3;
3136 ffelex_append_to_token_ (c
);
3141 c
= ffelex_backslash_ (c
, column
);
3145 if (!ffelex_backslash_reconsider_
)
3147 ffelex_append_to_token_ (c
);
3153 if (ffelex_backslash_reconsider_
)
3154 ffelex_backslash_reconsider_
= FALSE
;
3156 c
= ffelex_card_image_
[++column
];
3158 if (ffelex_raw_mode_
== 0)
3160 ffelex_send_token_ ();
3161 assert (ffelex_raw_mode_
== 0);
3163 c
= ffelex_card_image_
[++column
];
3164 if ((c
== '\0') || (c
== '!'))
3166 ffelex_finish_statement_ ();
3167 goto beginning_of_line
; /* :::::::::::::::::::: */
3169 if ((c
== '&') && ffelex_is_free_nonc_ctx_contin_ (column
+ 1))
3171 continuation_line
= TRUE
;
3172 goto beginning_of_line
; /* :::::::::::::::::::: */
3174 goto parse_nonraw_character_noncontin
; /* :::::::::::::::::::: */
3176 goto parse_raw_character
; /* :::::::::::::::::::: */
3179 parse_nonraw_character
: /* :::::::::::::::::::: */
3181 if ((c
== '&') && ffelex_is_free_nonc_ctx_contin_ (column
+ 1))
3183 continuation_line
= TRUE
;
3184 goto beginning_of_line
; /* :::::::::::::::::::: */
3187 parse_nonraw_character_noncontin
: /* :::::::::::::::::::: */
3189 switch (ffelex_token_
->type
)
3191 case FFELEX_typeNONE
:
3194 finish-statement/continue-statement
3197 c
= ffelex_card_image_
[++column
];
3198 if ((c
== '\0') || (c
== '!'))
3200 ffelex_finish_statement_ ();
3201 goto beginning_of_line
; /* :::::::::::::::::::: */
3203 if ((c
== '&') && ffelex_is_free_nonc_ctx_contin_ (column
+ 1))
3205 continuation_line
= TRUE
;
3206 goto beginning_of_line
; /* :::::::::::::::::::: */
3213 ffelex_token_
->type
= FFELEX_typeQUOTE
;
3214 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
3215 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
3216 ffelex_send_token_ ();
3220 ffelex_token_
->type
= FFELEX_typeDOLLAR
;
3221 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
3222 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
3223 ffelex_send_token_ ();
3227 ffelex_token_
->type
= FFELEX_typePERCENT
;
3228 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
3229 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
3230 ffelex_send_token_ ();
3234 ffelex_token_
->type
= FFELEX_typeAMPERSAND
;
3235 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
3236 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
3237 ffelex_send_token_ ();
3241 ffelex_token_
->type
= FFELEX_typeAPOSTROPHE
;
3242 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
3243 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
3244 ffelex_send_token_ ();
3248 ffelex_token_
->type
= FFELEX_typeOPEN_PAREN
;
3249 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
3250 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
3254 ffelex_token_
->type
= FFELEX_typeCLOSE_PAREN
;
3255 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
3256 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
3257 ffelex_send_token_ ();
3261 ffelex_token_
->type
= FFELEX_typeASTERISK
;
3262 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
3263 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
3267 ffelex_token_
->type
= FFELEX_typePLUS
;
3268 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
3269 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
3270 ffelex_send_token_ ();
3274 ffelex_token_
->type
= FFELEX_typeCOMMA
;
3275 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
3276 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
3277 ffelex_send_token_ ();
3281 ffelex_token_
->type
= FFELEX_typeMINUS
;
3282 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
3283 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
3284 ffelex_send_token_ ();
3288 ffelex_token_
->type
= FFELEX_typePERIOD
;
3289 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
3290 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
3291 ffelex_send_token_ ();
3295 ffelex_token_
->type
= FFELEX_typeSLASH
;
3296 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
3297 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
3311 = ffelex_hexnum_
? FFELEX_typeNAME
: FFELEX_typeNUMBER
;
3312 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
3313 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
3314 ffelex_append_to_token_ (c
);
3318 ffelex_token_
->type
= FFELEX_typeCOLON
;
3319 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
3320 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
3324 ffelex_token_
->type
= FFELEX_typeSEMICOLON
;
3325 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
3326 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
3327 ffelex_permit_include_
= TRUE
;
3328 ffelex_send_token_ ();
3329 ffelex_permit_include_
= FALSE
;
3333 ffelex_token_
->type
= FFELEX_typeOPEN_ANGLE
;
3334 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
3335 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
3339 ffelex_token_
->type
= FFELEX_typeEQUALS
;
3340 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
3341 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
3345 ffelex_token_
->type
= FFELEX_typeCLOSE_ANGLE
;
3346 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
3347 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
3351 ffelex_token_
->type
= FFELEX_typeQUESTION
;
3352 ffelex_token_
->where_line
= ffewhere_line_use (ffelex_current_wl_
);
3353 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
3354 ffelex_send_token_ ();
3358 if (1 || ffe_is_90 ())
3360 ffelex_token_
->type
= FFELEX_typeUNDERSCORE
;
3361 ffelex_token_
->where_line
3362 = ffewhere_line_use (ffelex_current_wl_
);
3363 ffelex_token_
->where_col
3364 = ffewhere_column_new (column
+ 1);
3365 ffelex_send_token_ ();
3421 c
= ffesrc_char_source (c
);
3423 if (ffesrc_char_match_init (c
, 'H', 'h')
3424 && ffelex_expecting_hollerith_
!= 0)
3426 ffelex_raw_mode_
= ffelex_expecting_hollerith_
;
3427 ffelex_token_
->type
= FFELEX_typeHOLLERITH
;
3428 ffelex_token_
->where_line
= ffelex_raw_where_line_
;
3429 ffelex_token_
->where_col
= ffelex_raw_where_col_
;
3430 ffelex_raw_where_line_
= ffewhere_line_unknown ();
3431 ffelex_raw_where_col_
= ffewhere_column_unknown ();
3432 c
= ffelex_card_image_
[++column
];
3433 goto parse_raw_character
; /* :::::::::::::::::::: */
3436 if (ffelex_names_pure_
)
3438 ffelex_token_
->where_line
3439 = ffewhere_line_use (ffelex_token_
->currentnames_line
3440 = ffewhere_line_use (ffelex_current_wl_
));
3441 ffelex_token_
->where_col
3442 = ffewhere_column_use (ffelex_token_
->currentnames_col
3443 = ffewhere_column_new (column
+ 1));
3444 ffelex_token_
->type
= FFELEX_typeNAMES
;
3448 ffelex_token_
->where_line
3449 = ffewhere_line_use (ffelex_current_wl_
);
3450 ffelex_token_
->where_col
= ffewhere_column_new (column
+ 1);
3451 ffelex_token_
->type
= FFELEX_typeNAME
;
3453 ffelex_append_to_token_ (c
);
3457 ffelex_bad_1_ (FFEBAD_UNRECOGNIZED_CHARACTER
,
3458 ffelex_linecount_current_
, column
+ 1);
3459 ffelex_finish_statement_ ();
3460 goto beginning_of_line
; /* :::::::::::::::::::: */
3464 case FFELEX_typeNAME
:
3519 c
= ffesrc_char_source (c
);
3534 && !ffe_is_dollar_ok ())
3536 ffelex_send_token_ ();
3537 goto parse_next_character
; /* :::::::::::::::::::: */
3539 ffelex_append_to_token_ (c
);
3543 ffelex_send_token_ ();
3544 goto parse_next_character
; /* :::::::::::::::::::: */
3548 case FFELEX_typeNAMES
:
3603 c
= ffesrc_char_source (c
);
3618 && !ffe_is_dollar_ok ())
3620 ffelex_send_token_ ();
3621 goto parse_next_character
; /* :::::::::::::::::::: */
3623 if (ffelex_token_
->length
< FFEWHERE_indexMAX
)
3625 ffewhere_track (&ffelex_token_
->currentnames_line
,
3626 &ffelex_token_
->currentnames_col
,
3627 ffelex_token_
->wheretrack
,
3628 ffelex_token_
->length
,
3629 ffelex_linecount_current_
,
3632 ffelex_append_to_token_ (c
);
3636 ffelex_send_token_ ();
3637 goto parse_next_character
; /* :::::::::::::::::::: */
3641 case FFELEX_typeNUMBER
:
3654 ffelex_append_to_token_ (c
);
3658 ffelex_send_token_ ();
3659 goto parse_next_character
; /* :::::::::::::::::::: */
3663 case FFELEX_typeASTERISK
:
3667 ffelex_token_
->type
= FFELEX_typePOWER
;
3668 ffelex_send_token_ ();
3671 default: /* * not followed by another *. */
3672 ffelex_send_token_ ();
3673 goto parse_next_character
; /* :::::::::::::::::::: */
3677 case FFELEX_typeCOLON
:
3681 ffelex_token_
->type
= FFELEX_typeCOLONCOLON
;
3682 ffelex_send_token_ ();
3685 default: /* : not followed by another :. */
3686 ffelex_send_token_ ();
3687 goto parse_next_character
; /* :::::::::::::::::::: */
3691 case FFELEX_typeSLASH
:
3695 ffelex_token_
->type
= FFELEX_typeCONCAT
;
3696 ffelex_send_token_ ();
3700 ffelex_token_
->type
= FFELEX_typeCLOSE_ARRAY
;
3701 ffelex_send_token_ ();
3705 ffelex_token_
->type
= FFELEX_typeREL_NE
;
3706 ffelex_send_token_ ();
3710 ffelex_send_token_ ();
3711 goto parse_next_character
; /* :::::::::::::::::::: */
3715 case FFELEX_typeOPEN_PAREN
:
3719 ffelex_token_
->type
= FFELEX_typeOPEN_ARRAY
;
3720 ffelex_send_token_ ();
3724 ffelex_send_token_ ();
3725 goto parse_next_character
; /* :::::::::::::::::::: */
3729 case FFELEX_typeOPEN_ANGLE
:
3733 ffelex_token_
->type
= FFELEX_typeREL_LE
;
3734 ffelex_send_token_ ();
3738 ffelex_send_token_ ();
3739 goto parse_next_character
; /* :::::::::::::::::::: */
3743 case FFELEX_typeEQUALS
:
3747 ffelex_token_
->type
= FFELEX_typeREL_EQ
;
3748 ffelex_send_token_ ();
3752 ffelex_token_
->type
= FFELEX_typePOINTS
;
3753 ffelex_send_token_ ();
3757 ffelex_send_token_ ();
3758 goto parse_next_character
; /* :::::::::::::::::::: */
3762 case FFELEX_typeCLOSE_ANGLE
:
3766 ffelex_token_
->type
= FFELEX_typeREL_GE
;
3767 ffelex_send_token_ ();
3771 ffelex_send_token_ ();
3772 goto parse_next_character
; /* :::::::::::::::::::: */
3777 assert ("Serious error!" == NULL
);
3782 c
= ffelex_card_image_
[++column
];
3784 parse_next_character
: /* :::::::::::::::::::: */
3786 if (ffelex_raw_mode_
!= 0)
3787 goto parse_raw_character
; /* :::::::::::::::::::: */
3789 if ((c
== '\0') || (c
== '!'))
3791 ffelex_finish_statement_ ();
3792 goto beginning_of_line
; /* :::::::::::::::::::: */
3794 goto parse_nonraw_character
; /* :::::::::::::::::::: */
3797 /* See the code in com.c that calls this to understand why. */
3800 ffelex_hash_kludge (FILE *finput
)
3802 /* If you change this constant string, you have to change whatever
3803 code might thus be affected by it in terms of having to use
3804 ffelex_getc_() instead of getc() in the lexers and _hash_. */
3805 static const char match
[] = "# 1 \"";
3806 static int kludge
[ARRAY_SIZE (match
) + 1];
3811 /* Read chars as long as they match the target string.
3812 Copy them into an array that will serve as a record
3813 of what we read (essentially a multi-char ungetc(),
3814 for code that uses ffelex_getc_ instead of getc() elsewhere
3816 for (p
= &match
[0], q
= &kludge
[0], c
= getc (finput
);
3817 (c
== *p
) && (*p
!= '\0') && (c
!= EOF
);
3818 ++p
, ++q
, c
= getc (finput
))
3821 *q
= c
; /* Might be EOF, which requires int. */
3824 ffelex_kludge_chars_
= &kludge
[0];
3828 ffelex_kludge_flag_
= TRUE
;
3829 ++ffelex_kludge_chars_
;
3830 ffelex_hash_ (finput
); /* Handle it NOW rather than later. */
3831 ffelex_kludge_flag_
= FALSE
;
3836 ffelex_init_1 (void)
3840 ffelex_final_nontab_column_
= ffe_fixed_line_length ();
3841 ffelex_card_size_
= FFELEX_columnINITIAL_SIZE_
;
3842 ffelex_card_image_
= malloc_new_ksr (malloc_pool_image (),
3843 "FFELEX card image",
3844 FFELEX_columnINITIAL_SIZE_
+ 9);
3845 ffelex_card_image_
[0] = '\0';
3847 for (i
= 0; i
< 256; ++i
)
3848 ffelex_first_char_
[i
] = FFELEX_typeERROR
;
3850 ffelex_first_char_
['\t'] = FFELEX_typeRAW
;
3851 ffelex_first_char_
['\n'] = FFELEX_typeCOMMENT
;
3852 ffelex_first_char_
['\v'] = FFELEX_typeCOMMENT
;
3853 ffelex_first_char_
['\f'] = FFELEX_typeCOMMENT
;
3854 ffelex_first_char_
['\r'] = FFELEX_typeRAW
;
3855 ffelex_first_char_
[' '] = FFELEX_typeRAW
;
3856 ffelex_first_char_
['!'] = FFELEX_typeCOMMENT
;
3857 ffelex_first_char_
['*'] = FFELEX_typeCOMMENT
;
3858 ffelex_first_char_
['/'] = FFELEX_typeSLASH
;
3859 ffelex_first_char_
['&'] = FFELEX_typeRAW
;
3860 ffelex_first_char_
['#'] = FFELEX_typeHASH
;
3862 for (i
= '0'; i
<= '9'; ++i
)
3863 ffelex_first_char_
[i
] = FFELEX_typeRAW
;
3865 if ((ffe_case_match () == FFE_caseNONE
)
3866 || ((ffe_case_match () == FFE_caseUPPER
)
3867 && (ffe_case_source () != FFE_caseLOWER
)) /* Idiot! :-) */
3868 || ((ffe_case_match () == FFE_caseLOWER
)
3869 && (ffe_case_source () == FFE_caseLOWER
)))
3871 ffelex_first_char_
['C'] = FFELEX_typeCOMMENT
;
3872 ffelex_first_char_
['D'] = FFELEX_typeCOMMENT
;
3874 if ((ffe_case_match () == FFE_caseNONE
)
3875 || ((ffe_case_match () == FFE_caseLOWER
)
3876 && (ffe_case_source () != FFE_caseUPPER
)) /* Idiot! :-) */
3877 || ((ffe_case_match () == FFE_caseUPPER
)
3878 && (ffe_case_source () == FFE_caseUPPER
)))
3880 ffelex_first_char_
['c'] = FFELEX_typeCOMMENT
;
3881 ffelex_first_char_
['d'] = FFELEX_typeCOMMENT
;
3884 ffelex_linecount_current_
= 0;
3885 ffelex_linecount_next_
= 1;
3886 ffelex_raw_mode_
= 0;
3887 ffelex_set_include_
= FALSE
;
3888 ffelex_permit_include_
= FALSE
;
3889 ffelex_names_
= TRUE
; /* First token in program is a names. */
3890 ffelex_names_pure_
= FALSE
; /* Free-form lexer does NAMES only for
3892 ffelex_hexnum_
= FALSE
;
3893 ffelex_expecting_hollerith_
= 0;
3894 ffelex_raw_where_line_
= ffewhere_line_unknown ();
3895 ffelex_raw_where_col_
= ffewhere_column_unknown ();
3897 ffelex_token_
= ffelex_token_new_ ();
3898 ffelex_token_
->type
= FFELEX_typeNONE
;
3899 ffelex_token_
->uses
= 1;
3900 ffelex_token_
->where_line
= ffewhere_line_unknown ();
3901 ffelex_token_
->where_col
= ffewhere_column_unknown ();
3902 ffelex_token_
->text
= NULL
;
3904 ffelex_handler_
= NULL
;
3907 /* ffelex_is_names_expected -- Is the current parser expecting NAMES vs. NAME?
3909 if (ffelex_is_names_expected())
3910 // Deliver NAMES token
3912 // Deliver NAME token
3914 Must be called while lexer is active, obviously. */
3917 ffelex_is_names_expected (void)
3919 return ffelex_names_
;
3922 /* Current card image, which has the master linecount number
3923 ffelex_linecount_current_. */
3928 return ffelex_card_image_
;
3931 /* ffelex_line_length -- Return length of current lexer line
3933 printf("Length is %lu\n",ffelex_line_length());
3935 Must be called while lexer is active, obviously. */
3937 ffewhereColumnNumber
3938 ffelex_line_length (void)
3940 return ffelex_card_length_
;
3943 /* Master line count of current card image, or 0 if no card image
3947 ffelex_line_number (void)
3949 return ffelex_linecount_current_
;
3952 /* ffelex_set_expecting_hollerith -- Set hollerith expectation status
3954 ffelex_set_expecting_hollerith(0);
3956 Lex initially assumes no hollerith constant is about to show up. If
3957 syntactic analysis expects one, it should call this function with the
3958 number of characters expected in the constant immediately after recognizing
3959 the decimal number preceding the "H" and the constant itself. Then, if
3960 the next character is indeed H, the lexer will interpret it as beginning
3961 a hollerith constant and ship the token formed by reading the specified
3962 number of characters (interpreting blanks and otherwise-comments too)
3963 from the input file. It is up to syntactic analysis to call this routine
3964 again with 0 to turn hollerith detection off immediately upon receiving
3965 the token that might or might not be HOLLERITH.
3967 Also call this after seeing an APOSTROPHE or QUOTE token that begins a
3968 character constant. Pass the expected termination character (apostrophe
3971 Pass for length either the length of the hollerith (must be > 0), -1
3972 meaning expecting a character constant, or 0 to cancel expectation of
3973 a hollerith only after calling it with a length of > 0 and receiving the
3974 next token (which may or may not have been a HOLLERITH token).
3976 Pass for which either an apostrophe or quote when passing length of -1.
3977 Else which is a don't-care.
3979 Pass for line and column the line/column info for the token beginning the
3980 character or hollerith constant, for use in error messages, when passing
3981 a length of -1 -- this function will invoke ffewhere_line/column_use to
3982 make its own copies. Else line and column are don't-cares (when length
3983 is 0) and the outstanding copies of the previous line/column info, if
3984 still around, are killed.
3987 When called with length of 0, also zero ffelex_raw_mode_. This is
3988 so ffest_save_ can undo the effects of replaying tokens like
3989 APOSTROPHE and QUOTE.
3991 New line, column arguments allow error messages to point to the true
3992 beginning of a character/hollerith constant, rather than the beginning
3993 of the content part, which makes them more consistent and helpful.
3995 New "which" argument allows caller to specify termination character,
3996 which should be apostrophe or double-quote, to support Fortran 90. */
3999 ffelex_set_expecting_hollerith (long length
, char which
,
4000 ffewhereLine line
, ffewhereColumn column
)
4003 /* First kill the pending line/col info, if any (should only be pending
4004 when this call has length==0, the previous call had length>0, and a
4005 non-HOLLERITH token was sent in between the calls, but play it safe). */
4007 ffewhere_line_kill (ffelex_raw_where_line_
);
4008 ffewhere_column_kill (ffelex_raw_where_col_
);
4010 /* Now handle the length function. */
4014 ffelex_expecting_hollerith_
= 0;
4015 ffelex_raw_mode_
= 0;
4016 ffelex_raw_where_line_
= ffewhere_line_unknown ();
4017 ffelex_raw_where_col_
= ffewhere_column_unknown ();
4018 return; /* Don't set new line/column info from args. */
4021 ffelex_raw_mode_
= -1;
4022 ffelex_raw_char_
= which
;
4025 default: /* length > 0 */
4026 ffelex_expecting_hollerith_
= length
;
4030 /* Now set new line/column information from passed args. */
4032 ffelex_raw_where_line_
= ffewhere_line_use (line
);
4033 ffelex_raw_where_col_
= ffewhere_column_use (column
);
4036 /* ffelex_set_handler -- Set handler for tokens before calling _fixed or _free
4038 ffelex_set_handler((ffelexHandler) my_first_handler);
4040 Must be called before calling ffelex_file_fixed or ffelex_file_free or
4041 after they return, but not while they are active. */
4044 ffelex_set_handler (ffelexHandler first
)
4046 ffelex_handler_
= first
;
4049 /* ffelex_set_hexnum -- Set hexnum flag
4051 ffelex_set_hexnum(TRUE);
4053 Lex normally interprets a token starting with [0-9] as a NUMBER token,
4054 so if it sees a [A-Za-z] in it, it stops parsing the NUMBER and leaves
4055 the character as the first of the next token. But when parsing a
4056 hexadecimal number, by calling this function with TRUE before starting
4057 the parse of the token itself, lex will interpret [0-9] as the start
4061 ffelex_set_hexnum (bool f
)
4066 /* ffelex_set_include -- Set INCLUDE file to be processed next
4068 ffewhereFile wf; // The ffewhereFile object for the file.
4069 bool free_form; // TRUE means read free-form file, FALSE fixed-form.
4070 FILE *fi; // The file to INCLUDE.
4071 ffelex_set_include(wf,free_form,fi);
4073 Must be called only after receiving the EOS token following a valid
4074 INCLUDE statement specifying a file that has already been successfully
4078 ffelex_set_include (ffewhereFile wf
, bool free_form
, FILE *fi
)
4080 assert (ffelex_permit_include_
);
4081 assert (!ffelex_set_include_
);
4082 ffelex_set_include_
= TRUE
;
4083 ffelex_include_free_form_
= free_form
;
4084 ffelex_include_file_
= fi
;
4085 ffelex_include_wherefile_
= wf
;
4088 /* ffelex_set_names -- Set names/name flag, names = TRUE
4090 ffelex_set_names(FALSE);
4092 Lex initially assumes multiple names should be formed. If this function is
4093 called with FALSE, then single names are formed instead. The differences
4094 are a difference in the token type (FFELEX_typeNAMES vs. FFELEX_typeNAME)
4095 and in whether full source-location tracking is performed (it is for
4096 multiple names, not for single names), which is more expensive in terms of
4100 ffelex_set_names (bool f
)
4104 ffelex_names_pure_
= FALSE
;
4107 /* ffelex_set_names_pure -- Set names/name (pure) flag, names = TRUE
4109 ffelex_set_names_pure(FALSE);
4111 Like ffelex_set_names, except affects both lexers. Normally, the
4112 free-form lexer need not generate NAMES tokens because adjacent NAME
4113 tokens must be separated by spaces which causes the lexer to generate
4114 separate tokens for analysis (whereas in fixed-form the spaces are
4115 ignored resulting in one long token). But in FORMAT statements, for
4116 some reason, the Fortran 90 standard specifies that spaces can occur
4117 anywhere within a format-item-list with no effect on the format spec
4118 (except of course within character string edit descriptors), which means
4119 that "1PE14.2" and "1 P E 1 4 . 2" are equivalent. For the FORMAT
4120 statement handling, the existence of spaces makes it hard to deal with,
4121 because each token is seen distinctly (i.e. seven tokens in the latter
4122 example). But when no spaces are provided, as in the former example,
4123 then only four tokens are generated, NUMBER("1"), NAME("PE14"), PERIOD,
4124 NUMBER ("2"). By generating a NAMES instead of NAME, three things happen:
4125 One, ffest_kw_format_ does a substring rather than full-string match,
4126 and thus matches "PE14" to "PE"; two, ffelex_token_xyz_from_names functions
4127 may be used to pull NAME/NAMES and NUMBER tokens out of the NAMES token;
4128 and three, error reporting can point to the actual character rather than
4129 at or prior to it. The first two things could be resolved by providing
4130 alternate functions fairly easy, thus allowing FORMAT handling to expect
4131 both lexers to generate NAME tokens instead of NAMES (with otherwise minor
4132 changes to FORMAT parsing), but the third, error reporting, would suffer,
4133 and when one makes mistakes in a FORMAT, believe me, one wants a pointer
4134 to exactly where the compilers thinks the problem is, to even begin to get
4135 a handle on it. So there. */
4138 ffelex_set_names_pure (bool f
)
4140 ffelex_names_pure_
= f
;
4144 /* ffelex_splice_tokens -- Splice off and send tokens from a NAMES
4146 return (ffelexHandler) ffelex_splice_tokens(first_handler,master_token,
4149 Returns first_handler if start_char_index chars into master_token (which
4150 must be a NAMES token) is '\0'. Else, creates a subtoken from that
4151 char, either NUMBER (if it is a digit), a NAME (if a valid firstnamechar),
4152 an UNDERSCORE (if an underscore), or DOLLAR (if a dollar sign)
4153 and sends it to first_handler. If anything other than NAME is sent, the
4154 character at the end of it in the master token is examined to see if it
4155 begins a NAME, NUMBER, UNDERSCORE, or DOLLAR, and, if so,
4156 the handler returned by first_handler is invoked with that token, and
4157 this process is repeated until the end of the master token or a NAME
4158 token is reached. */
4161 ffelex_splice_tokens (ffelexHandler first
, ffelexToken master
,
4162 ffeTokenLength start
)
4168 p
= ffelex_token_text (master
) + (i
= start
);
4174 t
= ffelex_token_number_from_names (master
, i
);
4175 p
+= ffelex_token_length (t
);
4176 i
+= ffelex_token_length (t
);
4178 else if (ffesrc_is_name_init (*p
))
4180 t
= ffelex_token_name_from_names (master
, i
, 0);
4181 p
+= ffelex_token_length (t
);
4182 i
+= ffelex_token_length (t
);
4186 t
= ffelex_token_dollar_from_names (master
, i
);
4192 t
= ffelex_token_uscore_from_names (master
, i
);
4198 assert ("not a valid NAMES character" == NULL
);
4201 assert (first
!= NULL
);
4202 first
= (ffelexHandler
) (*first
) (t
);
4203 ffelex_token_kill (t
);
4209 /* ffelex_swallow_tokens -- Eat all tokens delivered to me
4211 return ffelex_swallow_tokens;
4213 Return this handler when you don't want to look at any more tokens in the
4214 statement because you've encountered an unrecoverable error in the
4218 ffelex_swallow_tokens (ffelexToken t
, ffelexHandler handler
)
4220 assert (handler
!= NULL
);
4222 if ((t
!= NULL
) && ((ffelex_token_type (t
) == FFELEX_typeEOS
)
4223 || (ffelex_token_type (t
) == FFELEX_typeSEMICOLON
)))
4224 return (ffelexHandler
) (*handler
) (t
);
4226 ffelex_eos_handler_
= handler
;
4227 return (ffelexHandler
) ffelex_swallow_tokens_
;
4230 /* ffelex_token_dollar_from_names -- Return a dollar from within a names token
4233 t = ffelex_token_dollar_from_names(t,6);
4235 It's as if you made a new token of dollar type having the dollar
4236 at, in the example above, the sixth character of the NAMES token. */
4239 ffelex_token_dollar_from_names (ffelexToken t
, ffeTokenLength start
)
4244 assert (ffelex_token_type (t
) == FFELEX_typeNAMES
);
4245 assert (start
< t
->length
);
4246 assert (t
->text
[start
] == '$');
4248 /* Now make the token. */
4250 nt
= ffelex_token_new_ ();
4251 nt
->type
= FFELEX_typeDOLLAR
;
4254 ffewhere_set_from_track (&nt
->where_line
, &nt
->where_col
, t
->where_line
,
4255 t
->where_col
, t
->wheretrack
, start
);
4260 /* ffelex_token_kill -- Decrement use count for token, kill if no uses left
4263 ffelex_token_kill(t);
4265 Complements a call to ffelex_token_use or ffelex_token_new_.... */
4268 ffelex_token_kill (ffelexToken t
)
4272 assert (t
->uses
> 0);
4277 --ffelex_total_tokens_
;
4279 if (t
->type
== FFELEX_typeNAMES
)
4280 ffewhere_track_kill (t
->where_line
, t
->where_col
,
4281 t
->wheretrack
, t
->length
);
4282 ffewhere_line_kill (t
->where_line
);
4283 ffewhere_column_kill (t
->where_col
);
4284 if (t
->text
!= NULL
)
4285 malloc_kill_ksr (malloc_pool_image (), t
->text
, t
->size
+ 1);
4286 malloc_kill_ks (malloc_pool_image (), t
, sizeof (*t
));
4289 /* Make a new NAME token that is a substring of a NAMES token. */
4292 ffelex_token_name_from_names (ffelexToken t
, ffeTokenLength start
,
4298 assert (ffelex_token_type (t
) == FFELEX_typeNAMES
);
4299 assert (start
< t
->length
);
4301 len
= t
->length
- start
;
4305 assert ((start
+ len
) <= t
->length
);
4307 assert (ffelex_is_firstnamechar ((unsigned char)(t
->text
[start
])));
4309 nt
= ffelex_token_new_ ();
4310 nt
->type
= FFELEX_typeNAME
;
4311 nt
->size
= len
; /* Assume nobody's gonna fiddle with token
4315 ffewhere_set_from_track (&nt
->where_line
, &nt
->where_col
, t
->where_line
,
4316 t
->where_col
, t
->wheretrack
, start
);
4317 nt
->text
= malloc_new_ksr (malloc_pool_image (), "FFELEX token text",
4319 strncpy (nt
->text
, t
->text
+ start
, len
);
4320 nt
->text
[len
] = '\0';
4324 /* Make a new NAMES token that is a substring of another NAMES token. */
4327 ffelex_token_names_from_names (ffelexToken t
, ffeTokenLength start
,
4333 assert (ffelex_token_type (t
) == FFELEX_typeNAMES
);
4334 assert (start
< t
->length
);
4336 len
= t
->length
- start
;
4340 assert ((start
+ len
) <= t
->length
);
4342 assert (ffelex_is_firstnamechar ((unsigned char)(t
->text
[start
])));
4344 nt
= ffelex_token_new_ ();
4345 nt
->type
= FFELEX_typeNAMES
;
4346 nt
->size
= len
; /* Assume nobody's gonna fiddle with token
4350 ffewhere_set_from_track (&nt
->where_line
, &nt
->where_col
, t
->where_line
,
4351 t
->where_col
, t
->wheretrack
, start
);
4352 ffewhere_track_copy (nt
->wheretrack
, t
->wheretrack
, start
, len
);
4353 nt
->text
= malloc_new_ksr (malloc_pool_image (), "FFELEX token text",
4355 strncpy (nt
->text
, t
->text
+ start
, len
);
4356 nt
->text
[len
] = '\0';
4360 /* Make a new CHARACTER token. */
4363 ffelex_token_new_character (const char *s
, ffewhereLine l
, ffewhereColumn c
)
4367 t
= ffelex_token_new_ ();
4368 t
->type
= FFELEX_typeCHARACTER
;
4369 t
->length
= t
->size
= strlen (s
); /* Assume it won't get bigger. */
4371 t
->text
= malloc_new_ksr (malloc_pool_image (), "FFELEX token text",
4373 strcpy (t
->text
, s
);
4374 t
->where_line
= ffewhere_line_use (l
);
4375 t
->where_col
= ffewhere_column_new (c
);
4379 /* Make a new EOF token right after end of file. */
4382 ffelex_token_new_eof (void)
4386 t
= ffelex_token_new_ ();
4387 t
->type
= FFELEX_typeEOF
;
4390 t
->where_line
= ffewhere_line_new (ffelex_linecount_current_
);
4391 t
->where_col
= ffewhere_column_new (1);
4395 /* Make a new NAME token. */
4398 ffelex_token_new_name (const char *s
, ffewhereLine l
, ffewhereColumn c
)
4402 assert (ffelex_is_firstnamechar ((unsigned char)*s
));
4404 t
= ffelex_token_new_ ();
4405 t
->type
= FFELEX_typeNAME
;
4406 t
->length
= t
->size
= strlen (s
); /* Assume it won't get bigger. */
4408 t
->text
= malloc_new_ksr (malloc_pool_image (), "FFELEX token text",
4410 strcpy (t
->text
, s
);
4411 t
->where_line
= ffewhere_line_use (l
);
4412 t
->where_col
= ffewhere_column_new (c
);
4416 /* Make a new NAMES token. */
4419 ffelex_token_new_names (const char *s
, ffewhereLine l
, ffewhereColumn c
)
4423 assert (ffelex_is_firstnamechar ((unsigned char)*s
));
4425 t
= ffelex_token_new_ ();
4426 t
->type
= FFELEX_typeNAMES
;
4427 t
->length
= t
->size
= strlen (s
); /* Assume it won't get bigger. */
4429 t
->text
= malloc_new_ksr (malloc_pool_image (), "FFELEX token text",
4431 strcpy (t
->text
, s
);
4432 t
->where_line
= ffewhere_line_use (l
);
4433 t
->where_col
= ffewhere_column_new (c
);
4434 ffewhere_track_clear (t
->wheretrack
, t
->length
); /* Assume contiguous
4439 /* Make a new NUMBER token.
4441 The first character of the string must be a digit, and only the digits
4442 are copied into the new number. So this may be used to easily extract
4443 a NUMBER token from within any text string. Then the length of the
4444 resulting token may be used to calculate where the digits stopped
4445 in the original string. */
4448 ffelex_token_new_number (const char *s
, ffewhereLine l
, ffewhereColumn c
)
4453 /* How long is the string of decimal digits at s? */
4455 len
= strspn (s
, "0123456789");
4457 /* Make sure there is at least one digit. */
4461 /* Now make the token. */
4463 t
= ffelex_token_new_ ();
4464 t
->type
= FFELEX_typeNUMBER
;
4465 t
->length
= t
->size
= len
; /* Assume it won't get bigger. */
4467 t
->text
= malloc_new_ksr (malloc_pool_image (), "FFELEX token text",
4469 strncpy (t
->text
, s
, len
);
4470 t
->text
[len
] = '\0';
4471 t
->where_line
= ffewhere_line_use (l
);
4472 t
->where_col
= ffewhere_column_new (c
);
4476 /* Make a new token of any type that doesn't contain text. A private
4477 function that is used by public macros in the interface file. */
4480 ffelex_token_new_simple_ (ffelexType type
, ffewhereLine l
, ffewhereColumn c
)
4484 t
= ffelex_token_new_ ();
4488 t
->where_line
= ffewhere_line_use (l
);
4489 t
->where_col
= ffewhere_column_new (c
);
4493 /* Make a new NUMBER token from an existing NAMES token.
4495 Like ffelex_token_new_number, this function calculates the length
4496 of the digit string itself. */
4499 ffelex_token_number_from_names (ffelexToken t
, ffeTokenLength start
)
4505 assert (ffelex_token_type (t
) == FFELEX_typeNAMES
);
4506 assert (start
< t
->length
);
4508 /* How long is the string of decimal digits at s? */
4510 len
= strspn (t
->text
+ start
, "0123456789");
4512 /* Make sure there is at least one digit. */
4516 /* Now make the token. */
4518 nt
= ffelex_token_new_ ();
4519 nt
->type
= FFELEX_typeNUMBER
;
4520 nt
->size
= len
; /* Assume nobody's gonna fiddle with token
4524 ffewhere_set_from_track (&nt
->where_line
, &nt
->where_col
, t
->where_line
,
4525 t
->where_col
, t
->wheretrack
, start
);
4526 nt
->text
= malloc_new_ksr (malloc_pool_image (), "FFELEX token text",
4528 strncpy (nt
->text
, t
->text
+ start
, len
);
4529 nt
->text
[len
] = '\0';
4533 /* Make a new UNDERSCORE token from a NAMES token. */
4536 ffelex_token_uscore_from_names (ffelexToken t
, ffeTokenLength start
)
4541 assert (ffelex_token_type (t
) == FFELEX_typeNAMES
);
4542 assert (start
< t
->length
);
4543 assert (t
->text
[start
] == '_');
4545 /* Now make the token. */
4547 nt
= ffelex_token_new_ ();
4548 nt
->type
= FFELEX_typeUNDERSCORE
;
4550 ffewhere_set_from_track (&nt
->where_line
, &nt
->where_col
, t
->where_line
,
4551 t
->where_col
, t
->wheretrack
, start
);
4556 /* ffelex_token_use -- Return another instance of a token
4559 t = ffelex_token_use(t);
4561 In a sense, the new token is a copy of the old, though it might be the
4562 same with just a new use count.
4564 We use the use count method (easy). */
4567 ffelex_token_use (ffelexToken t
)
4570 assert ("_token_use: null token" == NULL
);
4575 #include "gt-f-lex.h"