More improvements of the Emacs manual
[emacs.git] / lib-src / make-docfile.c
blob61d53dc59d6c7666a3fd4307cb5bea71830b5e8c
1 /* Generate doc-string file for GNU Emacs from source files.
3 Copyright (C) 1985-1986, 1992-1994, 1997, 1999-2018 Free Software
4 Foundation, Inc.
6 This file is part of GNU Emacs.
8 GNU Emacs is free software: you can redistribute it and/or modify
9 it under the terms of the GNU General Public License as published by
10 the Free Software Foundation, either version 3 of the License, or (at
11 your option) any later version.
13 GNU Emacs is distributed in the hope that it will be useful,
14 but WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 GNU General Public License for more details.
18 You should have received a copy of the GNU General Public License
19 along with GNU Emacs. If not, see <https://www.gnu.org/licenses/>. */
22 /* The arguments given to this program are all the C and Lisp source files
23 of GNU Emacs. .elc and .el and .c files are allowed.
24 A .o file can also be specified; the .c file it was made from is used.
25 This helps the makefile pass the correct list of files.
26 Option -d DIR means change to DIR before looking for files.
28 The results, which go to standard output or to a file
29 specified with -a or -o (-a to append, -o to start from nothing),
30 are entries containing function or variable names and their documentation.
31 Each entry starts with a ^_ character.
32 Then comes F for a function or V for a variable.
33 Then comes the function or variable name, terminated with a newline.
34 Then comes the documentation for that function or variable.
37 #include <config.h>
39 #include <stdarg.h>
40 #include <stddef.h>
41 #include <stdint.h>
42 #include <stdlib.h>
43 #include <string.h>
45 #include <binary-io.h>
46 #include <intprops.h>
47 #include <min-max.h>
48 #include <unlocked-io.h>
50 #ifdef WINDOWSNT
51 /* Defined to be sys_fopen in ms-w32.h, but only #ifdef emacs, so this
52 is really just insurance. */
53 #undef fopen
54 #include <direct.h>
55 #endif /* WINDOWSNT */
57 #ifdef DOS_NT
58 /* Defined to be sys_chdir in ms-w32.h, but only #ifdef emacs, so this
59 is really just insurance.
61 Similarly, msdos defines this as sys_chdir, but we're not linking with the
62 file where that function is defined. */
63 #undef chdir
64 #define IS_SLASH(c) ((c) == '/' || (c) == '\\' || (c) == ':')
65 #else /* not DOS_NT */
66 #define IS_SLASH(c) ((c) == '/')
67 #endif /* not DOS_NT */
69 static void scan_file (char *filename);
70 static void scan_lisp_file (const char *filename, const char *mode);
71 static void scan_c_file (char *filename, const char *mode);
72 static void scan_c_stream (FILE *infile);
73 static void start_globals (void);
74 static void write_globals (void);
76 #include <unistd.h>
78 /* Name this program was invoked with. */
79 static char *progname;
81 /* True if this invocation is generating globals.h. */
82 static bool generate_globals;
84 /* Print error message. Args are like vprintf. */
86 static void ATTRIBUTE_FORMAT_PRINTF (1, 0)
87 verror (char const *m, va_list ap)
89 fprintf (stderr, "%s: ", progname);
90 vfprintf (stderr, m, ap);
91 fprintf (stderr, "\n");
94 /* Print error message. Args are like printf. */
96 static void ATTRIBUTE_FORMAT_PRINTF (1, 2)
97 error (char const *m, ...)
99 va_list ap;
100 va_start (ap, m);
101 verror (m, ap);
102 va_end (ap);
105 /* Print error message and exit. Args are like printf. */
107 static _Noreturn void ATTRIBUTE_FORMAT_PRINTF (1, 2)
108 fatal (char const *m, ...)
110 va_list ap;
111 va_start (ap, m);
112 verror (m, ap);
113 va_end (ap);
114 exit (EXIT_FAILURE);
117 static _Noreturn void
118 memory_exhausted (void)
120 fatal ("virtual memory exhausted");
123 /* Like malloc but get fatal error if memory is exhausted. */
125 static void *
126 xmalloc (ptrdiff_t size)
128 void *result = malloc (size);
129 if (result == NULL)
130 memory_exhausted ();
131 return result;
134 /* Like realloc but get fatal error if memory is exhausted. */
136 static void *
137 xrealloc (void *arg, ptrdiff_t size)
139 void *result = realloc (arg, size);
140 if (result == NULL)
141 memory_exhausted ();
142 return result;
147 main (int argc, char **argv)
149 int i;
151 progname = argv[0];
153 /* If first two args are -o FILE, output to FILE. */
154 i = 1;
155 if (argc > i + 1 && !strcmp (argv[i], "-o"))
157 if (! freopen (argv[i + 1], "w", stdout))
159 perror (argv[i + 1]);
160 return EXIT_FAILURE;
162 i += 2;
164 if (argc > i + 1 && !strcmp (argv[i], "-a"))
166 if (! freopen (argv[i + 1], "a", stdout))
168 perror (argv[i + 1]);
169 return EXIT_FAILURE;
171 i += 2;
173 if (argc > i + 1 && !strcmp (argv[i], "-d"))
175 if (chdir (argv[i + 1]) != 0)
177 perror (argv[i + 1]);
178 return EXIT_FAILURE;
180 i += 2;
182 if (argc > i && !strcmp (argv[i], "-g"))
184 generate_globals = true;
185 ++i;
188 set_binary_mode (fileno (stdout), O_BINARY);
190 if (generate_globals)
191 start_globals ();
193 if (argc <= i)
194 scan_c_stream (stdin);
195 else
197 int first_infile = i;
198 for (; i < argc; i++)
200 int j;
201 /* Don't process one file twice. */
202 for (j = first_infile; j < i; j++)
203 if (strcmp (argv[i], argv[j]) == 0)
204 break;
205 if (j == i)
206 scan_file (argv[i]);
210 if (generate_globals)
211 write_globals ();
213 if (ferror (stdout) || fclose (stdout) != 0)
214 fatal ("write error");
216 return EXIT_SUCCESS;
219 /* Add a source file name boundary marker in the output file. */
220 static void
221 put_filename (char *filename)
223 char *tmp;
225 for (tmp = filename; *tmp; tmp++)
227 if (IS_DIRECTORY_SEP (*tmp))
228 filename = tmp + 1;
231 printf ("\037S%s\n", filename);
234 /* Read file FILENAME and output its doc strings to stdout.
235 Return true if file is found, false otherwise. */
237 static void
238 scan_file (char *filename)
240 ptrdiff_t len = strlen (filename);
242 if (!generate_globals)
243 put_filename (filename);
244 if (len > 4 && !strcmp (filename + len - 4, ".elc"))
245 scan_lisp_file (filename, "rb");
246 else if (len > 3 && !strcmp (filename + len - 3, ".el"))
247 scan_lisp_file (filename, "r");
248 else
249 scan_c_file (filename, "r");
252 static void
253 start_globals (void)
255 puts ("/* This file was auto-generated by make-docfile. */");
256 puts ("/* DO NOT EDIT. */");
257 puts ("struct emacs_globals {");
260 static char input_buffer[128];
262 /* Some state during the execution of `read_c_string_or_comment'. */
263 struct rcsoc_state
265 /* A count of spaces and newlines that have been read, but not output. */
266 intmax_t pending_spaces, pending_newlines;
268 /* Where we're reading from. */
269 FILE *in_file;
271 /* If non-zero, a buffer into which to copy characters. */
272 char *buf_ptr;
273 /* If non-zero, a file into which to copy characters. */
274 FILE *out_file;
276 /* A keyword we look for at the beginning of lines. If found, it is
277 not copied, and SAW_KEYWORD is set to true. */
278 const char *keyword;
279 /* The current point we've reached in an occurrence of KEYWORD in
280 the input stream. */
281 const char *cur_keyword_ptr;
282 /* Set to true if we saw an occurrence of KEYWORD. */
283 bool saw_keyword;
286 /* Output CH to the file or buffer in STATE. Any pending newlines or
287 spaces are output first. */
289 static void
290 put_char (char ch, struct rcsoc_state *state)
292 char out_ch;
295 if (state->pending_newlines > 0)
297 state->pending_newlines--;
298 out_ch = '\n';
300 else if (state->pending_spaces > 0)
302 state->pending_spaces--;
303 out_ch = ' ';
305 else
306 out_ch = ch;
308 if (state->out_file)
309 putc (out_ch, state->out_file);
310 if (state->buf_ptr)
311 *state->buf_ptr++ = out_ch;
313 while (out_ch != ch);
316 /* If in the middle of scanning a keyword, continue scanning with
317 character CH, otherwise output CH to the file or buffer in STATE.
318 Any pending newlines or spaces are output first, as well as any
319 previously scanned characters that were thought to be part of a
320 keyword, but were in fact not. */
322 static void
323 scan_keyword_or_put_char (char ch, struct rcsoc_state *state)
325 if (state->keyword
326 && *state->cur_keyword_ptr == ch
327 && (state->cur_keyword_ptr > state->keyword
328 || state->pending_newlines > 0))
329 /* We might be looking at STATE->keyword at some point.
330 Keep looking until we know for sure. */
332 if (*++state->cur_keyword_ptr == '\0')
333 /* Saw the whole keyword. Set SAW_KEYWORD flag to true. */
335 state->saw_keyword = true;
337 /* Reset the scanning pointer. */
338 state->cur_keyword_ptr = state->keyword;
340 /* Canonicalize whitespace preceding a usage string. */
341 state->pending_newlines = 2;
342 state->pending_spaces = 0;
344 /* Skip any whitespace between the keyword and the
345 usage string. */
346 int c;
348 c = getc (state->in_file);
349 while (c == ' ' || c == '\n');
351 /* Output the open-paren we just read. */
352 if (c != '(')
353 fatal ("Missing '(' after keyword");
354 put_char (c, state);
356 /* Skip the function name and replace it with `fn'. */
359 c = getc (state->in_file);
360 if (c == EOF)
361 fatal ("Unexpected EOF after keyword");
363 while (c != ' ' && c != ')');
364 put_char ('f', state);
365 put_char ('n', state);
367 /* Put back the last character. */
368 ungetc (c, state->in_file);
371 else
373 if (state->keyword && state->cur_keyword_ptr > state->keyword)
374 /* We scanned the beginning of a potential usage
375 keyword, but it was a false alarm. Output the
376 part we scanned. */
378 const char *p;
380 for (p = state->keyword; p < state->cur_keyword_ptr; p++)
381 put_char (*p, state);
383 state->cur_keyword_ptr = state->keyword;
386 put_char (ch, state);
391 /* Skip a C string or C-style comment from INFILE, and return the
392 byte that follows, or EOF. COMMENT means skip a comment. If
393 PRINTFLAG is positive, output string contents to stdout. If it is
394 negative, store contents in buf. Convert escape sequences \n and
395 \t to newline and tab; discard \ followed by newline.
396 If SAW_USAGE is non-null, then any occurrences of the string "usage:"
397 at the beginning of a line will be removed, and *SAW_USAGE set to
398 true if any were encountered. */
400 static int
401 read_c_string_or_comment (FILE *infile, int printflag, bool comment,
402 bool *saw_usage)
404 int c;
405 struct rcsoc_state state;
407 state.in_file = infile;
408 state.buf_ptr = (printflag < 0 ? input_buffer : 0);
409 state.out_file = (printflag > 0 ? stdout : 0);
410 state.pending_spaces = 0;
411 state.pending_newlines = 0;
412 state.keyword = (saw_usage ? "usage:" : 0);
413 state.cur_keyword_ptr = state.keyword;
414 state.saw_keyword = false;
416 c = getc (infile);
417 if (comment)
418 while (c == '\n' || c == '\r' || c == '\t' || c == ' ')
419 c = getc (infile);
421 while (c != EOF)
423 while (c != EOF && (comment ? c != '*' : c != '"'))
425 if (c == '\\')
427 c = getc (infile);
428 if (c == '\n' || c == '\r')
430 c = getc (infile);
431 continue;
433 if (c == 'n')
434 c = '\n';
435 if (c == 't')
436 c = '\t';
439 if (c == ' ')
440 state.pending_spaces++;
441 else if (c == '\n')
443 state.pending_newlines++;
444 state.pending_spaces = 0;
446 else
447 scan_keyword_or_put_char (c, &state);
449 c = getc (infile);
452 if (c != EOF)
453 c = getc (infile);
455 if (comment)
457 if (c == '/')
459 c = getc (infile);
460 break;
463 scan_keyword_or_put_char ('*', &state);
465 else
467 if (c != '"')
468 break;
470 /* If we had a "", concatenate the two strings. */
471 c = getc (infile);
475 if (printflag < 0)
476 *state.buf_ptr = 0;
478 if (saw_usage)
479 *saw_usage = state.saw_keyword;
481 return c;
486 /* Write to stdout the argument names of function FUNC, whose text is in BUF.
487 MINARGS and MAXARGS are the minimum and maximum number of arguments. */
489 static void
490 write_c_args (char *func, char *buf, int minargs, int maxargs)
492 char *p;
493 bool in_ident = false;
494 char *ident_start UNINIT;
495 ptrdiff_t ident_length = 0;
497 fputs ("(fn", stdout);
499 if (*buf == '(')
500 ++buf;
502 for (p = buf; *p; p++)
504 char c = *p;
506 /* Notice when a new identifier starts. */
507 if ((('A' <= c && c <= 'Z')
508 || ('a' <= c && c <= 'z')
509 || ('0' <= c && c <= '9')
510 || c == '_')
511 != in_ident)
513 if (!in_ident)
515 in_ident = true;
516 ident_start = p;
518 else
520 in_ident = false;
521 ident_length = p - ident_start;
525 /* Found the end of an argument, write out the last seen
526 identifier. */
527 if (c == ',' || c == ')')
529 if (ident_length == 0)
531 error ("empty arg list for '%s' should be (void), not ()", func);
532 continue;
535 if (strncmp (ident_start, "void", ident_length) == 0)
536 continue;
538 putchar (' ');
540 if (minargs == 0 && maxargs > 0)
541 fputs ("&optional ", stdout);
543 minargs--;
544 maxargs--;
546 /* In C code, `default' is a reserved word, so we spell it
547 `defalt'; demangle that here. */
548 if (ident_length == 6 && memcmp (ident_start, "defalt", 6) == 0)
549 fputs ("DEFAULT", stdout);
550 else
551 while (ident_length-- > 0)
553 c = *ident_start++;
554 if (c >= 'a' && c <= 'z')
555 /* Upcase the letter. */
556 c += 'A' - 'a';
557 else if (c == '_')
558 /* Print underscore as hyphen. */
559 c = '-';
560 putchar (c);
565 putchar (')');
568 /* The types of globals. These are sorted roughly in decreasing alignment
569 order to avoid allocation gaps, except that symbols and functions
570 are last. */
571 enum global_type
573 INVALID,
574 LISP_OBJECT,
575 EMACS_INTEGER,
576 BOOLEAN,
577 SYMBOL,
578 FUNCTION
581 /* A single global. */
582 struct global
584 enum global_type type;
585 char *name;
586 int flags;
587 union
589 int value;
590 char const *svalue;
591 } v;
594 /* Bit values for FLAGS field from the above. Applied for DEFUNs only. */
595 enum { DEFUN_noreturn = 1, DEFUN_const = 2, DEFUN_noinline = 4 };
597 /* All the variable names we saw while scanning C sources in `-g'
598 mode. */
599 static ptrdiff_t num_globals;
600 static ptrdiff_t num_globals_allocated;
601 static struct global *globals;
603 static struct global *
604 add_global (enum global_type type, char const *name, int value,
605 char const *svalue)
607 /* Ignore the one non-symbol that can occur. */
608 if (strcmp (name, "..."))
610 if (num_globals == num_globals_allocated)
612 ptrdiff_t num_globals_max = (min (PTRDIFF_MAX, SIZE_MAX)
613 / sizeof *globals);
614 if (num_globals_allocated == num_globals_max)
615 memory_exhausted ();
616 if (num_globals_allocated < num_globals_max / 2)
617 num_globals_allocated = 2 * num_globals_allocated + 1;
618 else
619 num_globals_allocated = num_globals_max;
620 globals = xrealloc (globals, num_globals_allocated * sizeof *globals);
623 ++num_globals;
625 ptrdiff_t namesize = strlen (name) + 1;
626 char *buf = xmalloc (namesize + (svalue ? strlen (svalue) + 1 : 0));
627 globals[num_globals - 1].type = type;
628 globals[num_globals - 1].name = strcpy (buf, name);
629 if (svalue)
630 globals[num_globals - 1].v.svalue = strcpy (buf + namesize, svalue);
631 else
632 globals[num_globals - 1].v.value = value;
633 globals[num_globals - 1].flags = 0;
634 return globals + num_globals - 1;
636 return NULL;
639 static int
640 compare_globals (const void *a, const void *b)
642 const struct global *ga = a;
643 const struct global *gb = b;
645 if (ga->type != gb->type)
646 return ga->type - gb->type;
648 /* Consider "nil" to be the least, so that iQnil is zero. That
649 way, Qnil's internal representation is zero, which is a bit faster. */
650 if (ga->type == SYMBOL)
652 bool a_nil = strcmp (ga->name, "Qnil") == 0;
653 bool b_nil = strcmp (gb->name, "Qnil") == 0;
654 if (a_nil | b_nil)
655 return b_nil - a_nil;
658 return strcmp (ga->name, gb->name);
661 static void
662 close_emacs_globals (ptrdiff_t num_symbols)
664 printf (("};\n"
665 "extern struct emacs_globals globals;\n"
666 "\n"
667 "#ifndef DEFINE_SYMBOLS\n"
668 "extern\n"
669 "#endif\n"
670 "struct Lisp_Symbol lispsym[%td];\n"),
671 num_symbols);
674 static void
675 write_globals (void)
677 ptrdiff_t i, j;
678 bool seen_defun = false;
679 ptrdiff_t symnum = 0;
680 ptrdiff_t num_symbols = 0;
681 qsort (globals, num_globals, sizeof (struct global), compare_globals);
683 j = 0;
684 for (i = 0; i < num_globals; i++)
686 while (i + 1 < num_globals
687 && strcmp (globals[i].name, globals[i + 1].name) == 0)
689 if (globals[i].type == FUNCTION
690 && globals[i].v.value != globals[i + 1].v.value)
691 error ("function '%s' defined twice with differing signatures",
692 globals[i].name);
693 free (globals[i].name);
694 i++;
696 num_symbols += globals[i].type == SYMBOL;
697 globals[j++] = globals[i];
699 num_globals = j;
701 for (i = 0; i < num_globals; ++i)
703 char const *type = 0;
705 switch (globals[i].type)
707 case EMACS_INTEGER:
708 type = "EMACS_INT";
709 break;
710 case BOOLEAN:
711 type = "bool";
712 break;
713 case LISP_OBJECT:
714 type = "Lisp_Object";
715 break;
716 case SYMBOL:
717 case FUNCTION:
718 if (!seen_defun)
720 close_emacs_globals (num_symbols);
721 putchar ('\n');
722 seen_defun = true;
724 break;
725 default:
726 fatal ("not a recognized DEFVAR_");
729 if (type)
731 printf (" %s f_%s;\n", type, globals[i].name);
732 printf ("#define %s globals.f_%s\n",
733 globals[i].name, globals[i].name);
735 else if (globals[i].type == SYMBOL)
736 printf (("#define i%s %td\n"
737 "DEFINE_LISP_SYMBOL (%s)\n"),
738 globals[i].name, symnum++, globals[i].name);
739 else
741 if (globals[i].flags & DEFUN_noreturn)
742 fputs ("_Noreturn ", stdout);
743 if (globals[i].flags & DEFUN_noinline)
744 fputs ("NO_INLINE ", stdout);
746 printf ("EXFUN (%s, ", globals[i].name);
747 if (globals[i].v.value == -1)
748 fputs ("MANY", stdout);
749 else if (globals[i].v.value == -2)
750 fputs ("UNEVALLED", stdout);
751 else
752 printf ("%d", globals[i].v.value);
753 putchar (')');
755 if (globals[i].flags & DEFUN_const)
756 fputs (" ATTRIBUTE_CONST", stdout);
758 puts (";");
762 if (!seen_defun)
763 close_emacs_globals (num_symbols);
765 puts ("#ifdef DEFINE_SYMBOLS");
766 puts ("static char const *const defsym_name[] = {");
767 for (ptrdiff_t i = 0; i < num_globals; i++)
768 if (globals[i].type == SYMBOL)
769 printf ("\t\"%s\",\n", globals[i].v.svalue);
770 puts ("};");
771 puts ("#endif");
773 puts ("#define Qnil builtin_lisp_symbol (0)");
774 puts ("#if DEFINE_NON_NIL_Q_SYMBOL_MACROS");
775 num_symbols = 0;
776 for (ptrdiff_t i = 0; i < num_globals; i++)
777 if (globals[i].type == SYMBOL && num_symbols++ != 0)
778 printf ("# define %s builtin_lisp_symbol (%td)\n",
779 globals[i].name, num_symbols - 1);
780 puts ("#endif");
784 /* Read through a c file. If a .o file is named,
785 the corresponding .c or .m file is read instead.
786 Looks for DEFUN constructs such as are defined in ../src/lisp.h.
787 Accepts any word starting DEF... so it finds DEFSIMPLE and DEFPRED. */
789 static void
790 scan_c_file (char *filename, const char *mode)
792 FILE *infile;
793 char extension = filename[strlen (filename) - 1];
795 if (extension == 'o')
796 filename[strlen (filename) - 1] = 'c';
798 infile = fopen (filename, mode);
800 if (infile == NULL && extension == 'o')
802 /* Try .m. */
803 filename[strlen (filename) - 1] = 'm';
804 infile = fopen (filename, mode);
805 if (infile == NULL)
806 filename[strlen (filename) - 1] = 'c'; /* Don't confuse people. */
809 if (infile == NULL)
811 perror (filename);
812 exit (EXIT_FAILURE);
815 /* Reset extension to be able to detect duplicate files. */
816 filename[strlen (filename) - 1] = extension;
817 scan_c_stream (infile);
820 /* Return 1 if next input from INFILE is equal to P, -1 if EOF,
821 0 if input doesn't match. */
823 static int
824 stream_match (FILE *infile, const char *p)
826 for (; *p; p++)
828 int c = getc (infile);
829 if (c == EOF)
830 return -1;
831 if (c != *p)
832 return 0;
834 return 1;
837 static void
838 scan_c_stream (FILE *infile)
840 int commas, minargs, maxargs;
841 int c = '\n';
843 while (!feof (infile))
845 bool doc_keyword = false;
846 bool defunflag = false;
847 bool defvarperbufferflag = false;
848 bool defvarflag = false;
849 enum global_type type = INVALID;
850 static char name[sizeof input_buffer];
852 if (c != '\n' && c != '\r')
854 c = getc (infile);
855 continue;
857 c = getc (infile);
858 if (c == ' ')
860 while (c == ' ')
861 c = getc (infile);
862 if (c != 'D')
863 continue;
864 c = getc (infile);
865 if (c != 'E')
866 continue;
867 c = getc (infile);
868 if (c != 'F')
869 continue;
870 c = getc (infile);
871 if (c == 'S')
873 c = getc (infile);
874 if (c != 'Y')
875 continue;
876 c = getc (infile);
877 if (c != 'M')
878 continue;
879 c = getc (infile);
880 if (c != ' ' && c != '\t' && c != '(')
881 continue;
882 type = SYMBOL;
884 else if (c == 'V')
886 c = getc (infile);
887 if (c != 'A')
888 continue;
889 c = getc (infile);
890 if (c != 'R')
891 continue;
892 c = getc (infile);
893 if (c != '_')
894 continue;
896 defvarflag = true;
898 c = getc (infile);
899 defvarperbufferflag = (c == 'P');
900 if (generate_globals)
902 if (c == 'I')
903 type = EMACS_INTEGER;
904 else if (c == 'L')
905 type = LISP_OBJECT;
906 else if (c == 'B')
907 type = BOOLEAN;
910 c = getc (infile);
911 /* We need to distinguish between DEFVAR_BOOL and
912 DEFVAR_BUFFER_DEFAULTS. */
913 if (generate_globals && type == BOOLEAN && c != 'O')
914 type = INVALID;
916 else
917 continue;
919 else if (c == 'D')
921 c = getc (infile);
922 if (c != 'E')
923 continue;
924 c = getc (infile);
925 if (c != 'F')
926 continue;
927 c = getc (infile);
928 defunflag = c == 'U';
930 else continue;
932 if (generate_globals
933 && (!defvarflag || defvarperbufferflag || type == INVALID)
934 && !defunflag && type != SYMBOL)
935 continue;
937 while (c != '(')
939 if (c < 0)
940 goto eof;
941 c = getc (infile);
944 if (type != SYMBOL)
946 /* Lisp variable or function name. */
947 c = getc (infile);
948 if (c != '"')
949 continue;
950 c = read_c_string_or_comment (infile, -1, false, 0);
953 if (generate_globals)
955 ptrdiff_t i = 0;
956 char const *svalue = 0;
958 /* Skip "," and whitespace. */
961 c = getc (infile);
963 while (c == ',' || c == ' ' || c == '\t' || c == '\n' || c == '\r');
965 /* Read in the identifier. */
968 if (c < 0)
969 goto eof;
970 input_buffer[i++] = c;
971 if (sizeof input_buffer <= i)
972 fatal ("identifier too long");
973 c = getc (infile);
975 while (! (c == ',' || c == ' ' || c == '\t'
976 || c == '\n' || c == '\r'));
977 input_buffer[i] = '\0';
978 memcpy (name, input_buffer, i + 1);
980 if (type == SYMBOL)
983 c = getc (infile);
984 while (c == ' ' || c == '\t' || c == '\n' || c == '\r');
985 if (c != '"')
986 continue;
987 c = read_c_string_or_comment (infile, -1, false, 0);
988 svalue = input_buffer;
991 if (!defunflag)
993 add_global (type, name, 0, svalue);
994 continue;
998 if (type == SYMBOL)
999 continue;
1001 /* DEFVAR_LISP ("name", addr, "doc")
1002 DEFVAR_LISP ("name", addr /\* doc *\/)
1003 DEFVAR_LISP ("name", addr, doc: /\* doc *\/) */
1005 if (defunflag)
1006 commas = generate_globals ? 4 : 5;
1007 else if (defvarperbufferflag)
1008 commas = 3;
1009 else if (defvarflag)
1010 commas = 1;
1011 else /* For DEFSIMPLE and DEFPRED. */
1012 commas = 2;
1014 while (commas)
1016 if (c == ',')
1018 commas--;
1020 if (defunflag && (commas == 1 || commas == 2))
1022 int scanned = 0;
1024 c = getc (infile);
1025 while (c == ' ' || c == '\n' || c == '\r' || c == '\t');
1026 if (c < 0)
1027 goto eof;
1028 ungetc (c, infile);
1029 if (commas == 2) /* Pick up minargs. */
1030 scanned = fscanf (infile, "%d", &minargs);
1031 else /* Pick up maxargs. */
1032 if (c == 'M' || c == 'U') /* MANY || UNEVALLED */
1034 if (generate_globals)
1035 maxargs = (c == 'M') ? -1 : -2;
1036 else
1037 maxargs = -1;
1039 else
1040 scanned = fscanf (infile, "%d", &maxargs);
1041 if (scanned < 0)
1042 goto eof;
1046 if (c == EOF)
1047 goto eof;
1048 c = getc (infile);
1051 if (generate_globals)
1053 struct global *g = add_global (FUNCTION, name, maxargs, 0);
1054 if (!g)
1055 continue;
1057 /* The following code tries to recognize function attributes
1058 specified after the docstring, e.g.:
1060 DEFUN ("foo", Ffoo, Sfoo, X, Y, Z,
1061 doc: /\* doc *\/
1062 attributes: attribute1 attribute2 ...)
1063 (Lisp_Object arg...)
1065 Now only ’const’, ’noinline’ and 'noreturn' attributes
1066 are used. */
1068 /* Advance to the end of docstring. */
1069 c = getc (infile);
1070 if (c == EOF)
1071 goto eof;
1072 int d = getc (infile);
1073 if (d == EOF)
1074 goto eof;
1075 while (1)
1077 if (c == '*' && d == '/')
1078 break;
1079 c = d, d = getc (infile);
1080 if (d == EOF)
1081 goto eof;
1083 /* Skip spaces, if any. */
1086 c = getc (infile);
1087 if (c == EOF)
1088 goto eof;
1090 while (c == ' ' || c == '\n' || c == '\r' || c == '\t');
1091 /* Check for 'attributes:' token. */
1092 if (c == 'a' && stream_match (infile, "ttributes:"))
1094 char *p = input_buffer;
1095 /* Collect attributes up to ')'. */
1096 while (1)
1098 c = getc (infile);
1099 if (c == EOF)
1100 goto eof;
1101 if (c == ')')
1102 break;
1103 if (p - input_buffer > sizeof (input_buffer))
1104 abort ();
1105 *p++ = c;
1107 *p = 0;
1108 if (strstr (input_buffer, "noreturn"))
1109 g->flags |= DEFUN_noreturn;
1110 if (strstr (input_buffer, "const"))
1111 g->flags |= DEFUN_const;
1112 if (strstr (input_buffer, "noinline"))
1113 g->flags |= DEFUN_noinline;
1115 continue;
1118 while (c == ' ' || c == '\n' || c == '\r' || c == '\t')
1119 c = getc (infile);
1121 if (c == '"')
1122 c = read_c_string_or_comment (infile, 0, false, 0);
1124 while (c != EOF && c != ',' && c != '/')
1125 c = getc (infile);
1126 if (c == ',')
1128 c = getc (infile);
1129 while (c == ' ' || c == '\n' || c == '\r' || c == '\t')
1130 c = getc (infile);
1131 while ((c >= 'a' && c <= 'z') || (c >= 'Z' && c <= 'Z'))
1132 c = getc (infile);
1133 if (c == ':')
1135 doc_keyword = true;
1136 c = getc (infile);
1137 while (c == ' ' || c == '\n' || c == '\r' || c == '\t')
1138 c = getc (infile);
1142 if (c == '"'
1143 || (c == '/'
1144 && (c = getc (infile),
1145 ungetc (c, infile),
1146 c == '*')))
1148 bool comment = c != '"';
1149 bool saw_usage;
1151 printf ("\037%c%s\n", defvarflag ? 'V' : 'F', input_buffer);
1153 if (comment)
1154 getc (infile); /* Skip past `*'. */
1155 c = read_c_string_or_comment (infile, 1, comment, &saw_usage);
1157 /* If this is a defun, find the arguments and print them. If
1158 this function takes MANY or UNEVALLED args, then the C source
1159 won't give the names of the arguments, so we shouldn't bother
1160 trying to find them.
1162 Various doc-string styles:
1163 0: DEFUN (..., "DOC") (args) [!comment]
1164 1: DEFUN (..., /\* DOC *\/ (args)) [comment && !doc_keyword]
1165 2: DEFUN (..., doc: /\* DOC *\/) (args) [comment && doc_keyword]
1167 if (defunflag && maxargs != -1 && !saw_usage)
1169 char argbuf[1024], *p = argbuf;
1171 if (!comment || doc_keyword)
1172 while (c != ')')
1174 if (c < 0)
1175 goto eof;
1176 c = getc (infile);
1179 /* Skip into arguments. */
1180 while (c != '(')
1182 if (c < 0)
1183 goto eof;
1184 c = getc (infile);
1186 /* Copy arguments into ARGBUF. */
1187 *p++ = c;
1189 *p++ = c = getc (infile);
1190 while (c != ')');
1191 *p = '\0';
1192 /* Output them. */
1193 fputs ("\n\n", stdout);
1194 write_c_args (input_buffer, argbuf, minargs, maxargs);
1196 else if (defunflag && maxargs == -1 && !saw_usage)
1197 /* The DOC should provide the usage form. */
1198 fprintf (stderr, "Missing 'usage' for function '%s'.\n",
1199 input_buffer);
1202 eof:
1203 if (ferror (infile) || fclose (infile) != 0)
1204 fatal ("read error");
1207 /* Read a file of Lisp code, compiled or interpreted.
1208 Looks for
1209 (defun NAME ARGS DOCSTRING ...)
1210 (defmacro NAME ARGS DOCSTRING ...)
1211 (defsubst NAME ARGS DOCSTRING ...)
1212 (autoload (quote NAME) FILE DOCSTRING ...)
1213 (defvar NAME VALUE DOCSTRING)
1214 (defconst NAME VALUE DOCSTRING)
1215 (fset (quote NAME) (make-byte-code ... DOCSTRING ...))
1216 (fset (quote NAME) #[... DOCSTRING ...])
1217 (defalias (quote NAME) #[... DOCSTRING ...])
1218 (custom-declare-variable (quote NAME) VALUE DOCSTRING ...)
1219 starting in column zero.
1220 (quote NAME) may appear as 'NAME as well.
1222 We also look for #@LENGTH CONTENTS^_ at the beginning of the line.
1223 When we find that, we save it for the following defining-form,
1224 and we use that instead of reading a doc string within that defining-form.
1226 For defvar, defconst, and fset we skip to the docstring with a kludgy
1227 formatting convention: all docstrings must appear on the same line as the
1228 initial open-paren (the one in column zero) and must contain a backslash
1229 and a newline immediately after the initial double-quote. No newlines
1230 must appear between the beginning of the form and the first double-quote.
1231 For defun, defmacro, and autoload, we know how to skip over the
1232 arglist, but the doc string must still have a backslash and newline
1233 immediately after the double quote.
1234 The only source files that must follow this convention are preloaded
1235 uncompiled ones like loaddefs.el; aside from that, it is always the .elc
1236 file that we should look at, and they are no problem because byte-compiler
1237 output follows this convention.
1238 The NAME and DOCSTRING are output.
1239 NAME is preceded by `F' for a function or `V' for a variable.
1240 An entry is output only if DOCSTRING has \ newline just after the opening ".
1243 static void
1244 skip_white (FILE *infile)
1246 char c = ' ';
1247 while (c == ' ' || c == '\t' || c == '\n' || c == '\r')
1248 c = getc (infile);
1249 ungetc (c, infile);
1252 static void
1253 read_lisp_symbol (FILE *infile, char *buffer)
1255 char c;
1256 char *fillp = buffer;
1258 skip_white (infile);
1259 while (1)
1261 c = getc (infile);
1262 if (c == '\\')
1263 *(++fillp) = getc (infile);
1264 else if (c == ' ' || c == '\t' || c == '\n' || c == '\r' || c == '(' || c == ')')
1266 ungetc (c, infile);
1267 *fillp = 0;
1268 break;
1270 else
1271 *fillp++ = c;
1274 if (! buffer[0])
1275 fprintf (stderr, "## expected a symbol, got '%c'\n", c);
1277 skip_white (infile);
1280 static bool
1281 search_lisp_doc_at_eol (FILE *infile)
1283 int c = 0, c1 = 0, c2 = 0;
1285 /* Skip until the end of line; remember two previous chars. */
1286 while (c != '\n' && c != '\r' && c != EOF)
1288 c2 = c1;
1289 c1 = c;
1290 c = getc (infile);
1293 /* If two previous characters were " and \,
1294 this is a doc string. Otherwise, there is none. */
1295 if (c2 != '"' || c1 != '\\')
1297 #ifdef DEBUG
1298 fprintf (stderr, "## non-docstring found\n");
1299 #endif
1300 ungetc (c, infile);
1301 return false;
1303 return true;
1306 #define DEF_ELISP_FILE(fn) { #fn, sizeof(#fn) - 1 }
1308 static void
1309 scan_lisp_file (const char *filename, const char *mode)
1311 FILE *infile;
1312 int c;
1313 char *saved_string = 0;
1314 /* These are the only files that are loaded uncompiled, and must
1315 follow the conventions of the doc strings expected by this
1316 function. These conventions are automatically followed by the
1317 byte compiler when it produces the .elc files. */
1318 static struct {
1319 const char *fn;
1320 int fl;
1321 } const uncompiled[] = {
1322 DEF_ELISP_FILE (loaddefs.el),
1323 DEF_ELISP_FILE (loadup.el),
1324 DEF_ELISP_FILE (charprop.el),
1325 DEF_ELISP_FILE (cp51932.el),
1326 DEF_ELISP_FILE (eucjp-ms.el)
1328 int i;
1329 int flen = strlen (filename);
1331 if (generate_globals)
1332 fatal ("scanning lisp file when -g specified");
1333 if (flen > 3 && !strcmp (filename + flen - 3, ".el"))
1335 bool match = false;
1336 for (i = 0; i < sizeof (uncompiled) / sizeof (uncompiled[0]); i++)
1338 if (uncompiled[i].fl <= flen
1339 && !strcmp (filename + flen - uncompiled[i].fl, uncompiled[i].fn)
1340 && (flen == uncompiled[i].fl
1341 || IS_SLASH (filename[flen - uncompiled[i].fl - 1])))
1343 match = true;
1344 break;
1347 if (!match)
1348 fatal ("uncompiled lisp file %s is not supported", filename);
1351 infile = fopen (filename, mode);
1352 if (infile == NULL)
1354 perror (filename);
1355 exit (EXIT_FAILURE);
1358 c = '\n';
1359 while (!feof (infile))
1361 char buffer[BUFSIZ];
1362 char type;
1364 /* If not at end of line, skip till we get to one. */
1365 if (c != '\n' && c != '\r')
1367 c = getc (infile);
1368 continue;
1370 /* Skip the line break. */
1371 while (c == '\n' || c == '\r')
1372 c = getc (infile);
1373 /* Detect a dynamic doc string and save it for the next expression. */
1374 if (c == '#')
1376 c = getc (infile);
1377 if (c == '@')
1379 ptrdiff_t length = 0;
1380 ptrdiff_t i;
1382 /* Read the length. */
1383 while ((c = getc (infile),
1384 c >= '0' && c <= '9'))
1386 if (INT_MULTIPLY_WRAPV (length, 10, &length)
1387 || INT_ADD_WRAPV (length, c - '0', &length)
1388 || SIZE_MAX < length)
1389 memory_exhausted ();
1392 if (length <= 1)
1393 fatal ("invalid dynamic doc string length");
1395 if (c != ' ')
1396 fatal ("space not found after dynamic doc string length");
1398 /* The next character is a space that is counted in the length
1399 but not part of the doc string.
1400 We already read it, so just ignore it. */
1401 length--;
1403 /* Read in the contents. */
1404 free (saved_string);
1405 saved_string = xmalloc (length);
1406 for (i = 0; i < length; i++)
1407 saved_string[i] = getc (infile);
1408 /* The last character is a ^_.
1409 That is needed in the .elc file
1410 but it is redundant in DOC. So get rid of it here. */
1411 saved_string[length - 1] = 0;
1412 /* Skip the line break. */
1413 while (c == '\n' || c == '\r')
1414 c = getc (infile);
1415 /* Skip the following line. */
1416 while (c != '\n' && c != '\r')
1417 c = getc (infile);
1419 continue;
1422 if (c != '(')
1423 continue;
1425 read_lisp_symbol (infile, buffer);
1427 if (! strcmp (buffer, "defun")
1428 || ! strcmp (buffer, "defmacro")
1429 || ! strcmp (buffer, "defsubst"))
1431 type = 'F';
1432 read_lisp_symbol (infile, buffer);
1434 /* Skip the arguments: either "nil" or a list in parens. */
1436 c = getc (infile);
1437 if (c == 'n') /* nil */
1439 if ((c = getc (infile)) != 'i'
1440 || (c = getc (infile)) != 'l')
1442 fprintf (stderr, "## unparsable arglist in %s (%s)\n",
1443 buffer, filename);
1444 continue;
1447 else if (c != '(')
1449 fprintf (stderr, "## unparsable arglist in %s (%s)\n",
1450 buffer, filename);
1451 continue;
1453 else
1454 while (c != ')')
1455 c = getc (infile);
1456 skip_white (infile);
1458 /* If the next three characters aren't `dquote bslash newline'
1459 then we're not reading a docstring.
1461 if ((c = getc (infile)) != '"'
1462 || (c = getc (infile)) != '\\'
1463 || ((c = getc (infile)) != '\n' && c != '\r'))
1465 #ifdef DEBUG
1466 fprintf (stderr, "## non-docstring in %s (%s)\n",
1467 buffer, filename);
1468 #endif
1469 continue;
1473 /* defcustom can only occur in uncompiled Lisp files. */
1474 else if (! strcmp (buffer, "defvar")
1475 || ! strcmp (buffer, "defconst")
1476 || ! strcmp (buffer, "defcustom"))
1478 type = 'V';
1479 read_lisp_symbol (infile, buffer);
1481 if (saved_string == 0)
1482 if (!search_lisp_doc_at_eol (infile))
1483 continue;
1486 else if (! strcmp (buffer, "custom-declare-variable")
1487 || ! strcmp (buffer, "defvaralias")
1490 type = 'V';
1492 c = getc (infile);
1493 if (c == '\'')
1494 read_lisp_symbol (infile, buffer);
1495 else
1497 if (c != '(')
1499 fprintf (stderr,
1500 "## unparsable name in custom-declare-variable in %s\n",
1501 filename);
1502 continue;
1504 read_lisp_symbol (infile, buffer);
1505 if (strcmp (buffer, "quote"))
1507 fprintf (stderr,
1508 "## unparsable name in custom-declare-variable in %s\n",
1509 filename);
1510 continue;
1512 read_lisp_symbol (infile, buffer);
1513 c = getc (infile);
1514 if (c != ')')
1516 fprintf (stderr,
1517 "## unparsable quoted name in custom-declare-variable in %s\n",
1518 filename);
1519 continue;
1523 if (saved_string == 0)
1524 if (!search_lisp_doc_at_eol (infile))
1525 continue;
1528 else if (! strcmp (buffer, "fset") || ! strcmp (buffer, "defalias"))
1530 type = 'F';
1532 c = getc (infile);
1533 if (c == '\'')
1534 read_lisp_symbol (infile, buffer);
1535 else
1537 if (c != '(')
1539 fprintf (stderr, "## unparsable name in fset in %s\n",
1540 filename);
1541 continue;
1543 read_lisp_symbol (infile, buffer);
1544 if (strcmp (buffer, "quote"))
1546 fprintf (stderr, "## unparsable name in fset in %s\n",
1547 filename);
1548 continue;
1550 read_lisp_symbol (infile, buffer);
1551 c = getc (infile);
1552 if (c != ')')
1554 fprintf (stderr,
1555 "## unparsable quoted name in fset in %s\n",
1556 filename);
1557 continue;
1561 if (saved_string == 0)
1562 if (!search_lisp_doc_at_eol (infile))
1563 continue;
1566 else if (! strcmp (buffer, "autoload"))
1568 type = 'F';
1569 c = getc (infile);
1570 if (c == '\'')
1571 read_lisp_symbol (infile, buffer);
1572 else
1574 if (c != '(')
1576 fprintf (stderr, "## unparsable name in autoload in %s\n",
1577 filename);
1578 continue;
1580 read_lisp_symbol (infile, buffer);
1581 if (strcmp (buffer, "quote"))
1583 fprintf (stderr, "## unparsable name in autoload in %s\n",
1584 filename);
1585 continue;
1587 read_lisp_symbol (infile, buffer);
1588 c = getc (infile);
1589 if (c != ')')
1591 fprintf (stderr,
1592 "## unparsable quoted name in autoload in %s\n",
1593 filename);
1594 continue;
1597 skip_white (infile);
1598 if ((c = getc (infile)) != '\"')
1600 fprintf (stderr, "## autoload of %s unparsable (%s)\n",
1601 buffer, filename);
1602 continue;
1604 read_c_string_or_comment (infile, 0, false, 0);
1606 if (saved_string == 0)
1607 if (!search_lisp_doc_at_eol (infile))
1608 continue;
1611 #ifdef DEBUG
1612 else if (! strcmp (buffer, "if")
1613 || ! strcmp (buffer, "byte-code"))
1614 continue;
1615 #endif
1617 else
1619 #ifdef DEBUG
1620 fprintf (stderr, "## unrecognized top-level form, %s (%s)\n",
1621 buffer, filename);
1622 #endif
1623 continue;
1626 /* At this point, we should either use the previous dynamic doc string in
1627 saved_string or gobble a doc string from the input file.
1628 In the latter case, the opening quote (and leading backslash-newline)
1629 have already been read. */
1631 printf ("\037%c%s\n", type, buffer);
1632 if (saved_string)
1634 fputs (saved_string, stdout);
1635 /* Don't use one dynamic doc string twice. */
1636 free (saved_string);
1637 saved_string = 0;
1639 else
1640 read_c_string_or_comment (infile, 1, false, 0);
1642 free (saved_string);
1643 if (ferror (infile) || fclose (infile) != 0)
1644 fatal ("%s: read error", filename);
1648 /* make-docfile.c ends here */