1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510151115121513151415151516151715181519152015211522152315241525152615271528152915301531153215331534153515361537153815391540154115421543154415451546154715481549155015511552155315541555155615571558155915601561156215631564156515661567156815691570157115721573157415751576157715781579158015811582158315841585158615871588158915901591159215931594159515961597159815991600160116021603160416051606160716081609161016111612161316141615161616171618161916201621162216231624162516261627162816291630163116321633163416351636163716381639164016411642164316441645164616471648164916501651165216531654 |
- /* Generate doc-string file for GNU Emacs from source files.
- Copyright (C) 1985-1986, 1992-1994, 1997, 1999-2016 Free Software
- Foundation, Inc.
- This file is part of GNU Emacs.
- GNU Emacs is free software: you can redistribute it and/or modify
- it under the terms of the GNU General Public License as published by
- the Free Software Foundation, either version 3 of the License, or (at
- your option) any later version.
- GNU Emacs is distributed in the hope that it will be useful,
- but WITHOUT ANY WARRANTY; without even the implied warranty of
- MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- GNU General Public License for more details.
- You should have received a copy of the GNU General Public License
- along with GNU Emacs. If not, see <http://www.gnu.org/licenses/>. */
- /* The arguments given to this program are all the C and Lisp source files
- of GNU Emacs. .elc and .el and .c files are allowed.
- A .o file can also be specified; the .c file it was made from is used.
- This helps the makefile pass the correct list of files.
- Option -d DIR means change to DIR before looking for files.
- The results, which go to standard output or to a file
- specified with -a or -o (-a to append, -o to start from nothing),
- are entries containing function or variable names and their documentation.
- Each entry starts with a ^_ character.
- Then comes F for a function or V for a variable.
- Then comes the function or variable name, terminated with a newline.
- Then comes the documentation for that function or variable.
- */
- #include <config.h>
- #include <stdarg.h>
- #include <stdbool.h>
- #include <stddef.h>
- #include <stdint.h>
- #include <stdio.h>
- #include <stdlib.h> /* config.h unconditionally includes this anyway */
- #ifdef WINDOWSNT
- /* Defined to be sys_fopen in ms-w32.h, but only #ifdef emacs, so this
- is really just insurance. */
- #undef fopen
- #include <direct.h>
- #endif /* WINDOWSNT */
- #include <binary-io.h>
- #include <intprops.h>
- #include <min-max.h>
- #ifdef DOS_NT
- /* Defined to be sys_chdir in ms-w32.h, but only #ifdef emacs, so this
- is really just insurance.
- Similarly, msdos defines this as sys_chdir, but we're not linking with the
- file where that function is defined. */
- #undef chdir
- #define IS_SLASH(c) ((c) == '/' || (c) == '\\' || (c) == ':')
- #else /* not DOS_NT */
- #define IS_SLASH(c) ((c) == '/')
- #endif /* not DOS_NT */
- static void scan_file (char *filename);
- static void scan_lisp_file (const char *filename, const char *mode);
- static void scan_c_file (char *filename, const char *mode);
- static void scan_c_stream (FILE *infile);
- static void start_globals (void);
- static void write_globals (void);
- #include <unistd.h>
- /* Name this program was invoked with. */
- static char *progname;
- /* True if this invocation is generating globals.h. */
- static bool generate_globals;
- /* Print error message. Args are like vprintf. */
- static void ATTRIBUTE_FORMAT_PRINTF (1, 0)
- verror (char const *m, va_list ap)
- {
- fprintf (stderr, "%s: ", progname);
- vfprintf (stderr, m, ap);
- fprintf (stderr, "\n");
- }
- /* Print error message. Args are like printf. */
- static void ATTRIBUTE_FORMAT_PRINTF (1, 2)
- error (char const *m, ...)
- {
- va_list ap;
- va_start (ap, m);
- verror (m, ap);
- va_end (ap);
- }
- /* Print error message and exit. Args are like printf. */
- static _Noreturn void ATTRIBUTE_FORMAT_PRINTF (1, 2)
- fatal (char const *m, ...)
- {
- va_list ap;
- va_start (ap, m);
- verror (m, ap);
- va_end (ap);
- exit (EXIT_FAILURE);
- }
- static _Noreturn void
- memory_exhausted (void)
- {
- fatal ("virtual memory exhausted");
- }
- /* Like malloc but get fatal error if memory is exhausted. */
- static void *
- xmalloc (ptrdiff_t size)
- {
- void *result = malloc (size);
- if (result == NULL)
- memory_exhausted ();
- return result;
- }
- /* Like realloc but get fatal error if memory is exhausted. */
- static void *
- xrealloc (void *arg, ptrdiff_t size)
- {
- void *result = realloc (arg, size);
- if (result == NULL)
- memory_exhausted ();
- return result;
- }
- int
- main (int argc, char **argv)
- {
- int i;
- progname = argv[0];
- /* If first two args are -o FILE, output to FILE. */
- i = 1;
- if (argc > i + 1 && !strcmp (argv[i], "-o"))
- {
- if (! freopen (argv[i + 1], "w", stdout))
- {
- perror (argv[i + 1]);
- return EXIT_FAILURE;
- }
- i += 2;
- }
- if (argc > i + 1 && !strcmp (argv[i], "-a"))
- {
- if (! freopen (argv[i + 1], "a", stdout))
- {
- perror (argv[i + 1]);
- return EXIT_FAILURE;
- }
- i += 2;
- }
- if (argc > i + 1 && !strcmp (argv[i], "-d"))
- {
- if (chdir (argv[i + 1]) != 0)
- {
- perror (argv[i + 1]);
- return EXIT_FAILURE;
- }
- i += 2;
- }
- if (argc > i && !strcmp (argv[i], "-g"))
- {
- generate_globals = true;
- ++i;
- }
- set_binary_mode (fileno (stdout), O_BINARY);
- if (generate_globals)
- start_globals ();
- if (argc <= i)
- scan_c_stream (stdin);
- else
- {
- int first_infile = i;
- for (; i < argc; i++)
- {
- int j;
- /* Don't process one file twice. */
- for (j = first_infile; j < i; j++)
- if (strcmp (argv[i], argv[j]) == 0)
- break;
- if (j == i)
- scan_file (argv[i]);
- }
- }
- if (generate_globals)
- write_globals ();
- if (ferror (stdout) || fclose (stdout) != 0)
- fatal ("write error");
- return EXIT_SUCCESS;
- }
- /* Add a source file name boundary marker in the output file. */
- static void
- put_filename (char *filename)
- {
- char *tmp;
- for (tmp = filename; *tmp; tmp++)
- {
- if (IS_DIRECTORY_SEP (*tmp))
- filename = tmp + 1;
- }
- printf ("\037S%s\n", filename);
- }
- /* Read file FILENAME and output its doc strings to stdout.
- Return true if file is found, false otherwise. */
- static void
- scan_file (char *filename)
- {
- ptrdiff_t len = strlen (filename);
- if (!generate_globals)
- put_filename (filename);
- if (len > 4 && !strcmp (filename + len - 4, ".elc"))
- scan_lisp_file (filename, "rb");
- else if (len > 3 && !strcmp (filename + len - 3, ".el"))
- scan_lisp_file (filename, "r");
- else
- scan_c_file (filename, "r");
- }
- static void
- start_globals (void)
- {
- puts ("/* This file was auto-generated by make-docfile. */");
- puts ("/* DO NOT EDIT. */");
- puts ("struct emacs_globals {");
- }
- static char input_buffer[128];
- /* Some state during the execution of `read_c_string_or_comment'. */
- struct rcsoc_state
- {
- /* A count of spaces and newlines that have been read, but not output. */
- intmax_t pending_spaces, pending_newlines;
- /* Where we're reading from. */
- FILE *in_file;
- /* If non-zero, a buffer into which to copy characters. */
- char *buf_ptr;
- /* If non-zero, a file into which to copy characters. */
- FILE *out_file;
- /* A keyword we look for at the beginning of lines. If found, it is
- not copied, and SAW_KEYWORD is set to true. */
- const char *keyword;
- /* The current point we've reached in an occurrence of KEYWORD in
- the input stream. */
- const char *cur_keyword_ptr;
- /* Set to true if we saw an occurrence of KEYWORD. */
- bool saw_keyword;
- };
- /* Output CH to the file or buffer in STATE. Any pending newlines or
- spaces are output first. */
- static void
- put_char (char ch, struct rcsoc_state *state)
- {
- char out_ch;
- do
- {
- if (state->pending_newlines > 0)
- {
- state->pending_newlines--;
- out_ch = '\n';
- }
- else if (state->pending_spaces > 0)
- {
- state->pending_spaces--;
- out_ch = ' ';
- }
- else
- out_ch = ch;
- if (state->out_file)
- putc (out_ch, state->out_file);
- if (state->buf_ptr)
- *state->buf_ptr++ = out_ch;
- }
- while (out_ch != ch);
- }
- /* If in the middle of scanning a keyword, continue scanning with
- character CH, otherwise output CH to the file or buffer in STATE.
- Any pending newlines or spaces are output first, as well as any
- previously scanned characters that were thought to be part of a
- keyword, but were in fact not. */
- static void
- scan_keyword_or_put_char (char ch, struct rcsoc_state *state)
- {
- if (state->keyword
- && *state->cur_keyword_ptr == ch
- && (state->cur_keyword_ptr > state->keyword
- || state->pending_newlines > 0))
- /* We might be looking at STATE->keyword at some point.
- Keep looking until we know for sure. */
- {
- if (*++state->cur_keyword_ptr == '\0')
- /* Saw the whole keyword. Set SAW_KEYWORD flag to true. */
- {
- state->saw_keyword = true;
- /* Reset the scanning pointer. */
- state->cur_keyword_ptr = state->keyword;
- /* Canonicalize whitespace preceding a usage string. */
- state->pending_newlines = 2;
- state->pending_spaces = 0;
- /* Skip any whitespace between the keyword and the
- usage string. */
- int c;
- do
- c = getc (state->in_file);
- while (c == ' ' || c == '\n');
- /* Output the open-paren we just read. */
- if (c != '(')
- fatal ("Missing '(' after keyword");
- put_char (c, state);
- /* Skip the function name and replace it with `fn'. */
- do
- {
- c = getc (state->in_file);
- if (c == EOF)
- fatal ("Unexpected EOF after keyword");
- }
- while (c != ' ' && c != ')');
- put_char ('f', state);
- put_char ('n', state);
- /* Put back the last character. */
- ungetc (c, state->in_file);
- }
- }
- else
- {
- if (state->keyword && state->cur_keyword_ptr > state->keyword)
- /* We scanned the beginning of a potential usage
- keyword, but it was a false alarm. Output the
- part we scanned. */
- {
- const char *p;
- for (p = state->keyword; p < state->cur_keyword_ptr; p++)
- put_char (*p, state);
- state->cur_keyword_ptr = state->keyword;
- }
- put_char (ch, state);
- }
- }
- /* Skip a C string or C-style comment from INFILE, and return the
- byte that follows, or EOF. COMMENT means skip a comment. If
- PRINTFLAG is positive, output string contents to stdout. If it is
- negative, store contents in buf. Convert escape sequences \n and
- \t to newline and tab; discard \ followed by newline.
- If SAW_USAGE is non-null, then any occurrences of the string "usage:"
- at the beginning of a line will be removed, and *SAW_USAGE set to
- true if any were encountered. */
- static int
- read_c_string_or_comment (FILE *infile, int printflag, bool comment,
- bool *saw_usage)
- {
- int c;
- struct rcsoc_state state;
- state.in_file = infile;
- state.buf_ptr = (printflag < 0 ? input_buffer : 0);
- state.out_file = (printflag > 0 ? stdout : 0);
- state.pending_spaces = 0;
- state.pending_newlines = 0;
- state.keyword = (saw_usage ? "usage:" : 0);
- state.cur_keyword_ptr = state.keyword;
- state.saw_keyword = false;
- c = getc (infile);
- if (comment)
- while (c == '\n' || c == '\r' || c == '\t' || c == ' ')
- c = getc (infile);
- while (c != EOF)
- {
- while (c != EOF && (comment ? c != '*' : c != '"'))
- {
- if (c == '\\')
- {
- c = getc (infile);
- if (c == '\n' || c == '\r')
- {
- c = getc (infile);
- continue;
- }
- if (c == 'n')
- c = '\n';
- if (c == 't')
- c = '\t';
- }
- if (c == ' ')
- state.pending_spaces++;
- else if (c == '\n')
- {
- state.pending_newlines++;
- state.pending_spaces = 0;
- }
- else
- scan_keyword_or_put_char (c, &state);
- c = getc (infile);
- }
- if (c != EOF)
- c = getc (infile);
- if (comment)
- {
- if (c == '/')
- {
- c = getc (infile);
- break;
- }
- scan_keyword_or_put_char ('*', &state);
- }
- else
- {
- if (c != '"')
- break;
- /* If we had a "", concatenate the two strings. */
- c = getc (infile);
- }
- }
- if (printflag < 0)
- *state.buf_ptr = 0;
- if (saw_usage)
- *saw_usage = state.saw_keyword;
- return c;
- }
- /* Write to stdout the argument names of function FUNC, whose text is in BUF.
- MINARGS and MAXARGS are the minimum and maximum number of arguments. */
- static void
- write_c_args (char *func, char *buf, int minargs, int maxargs)
- {
- char *p;
- bool in_ident = false;
- char *ident_start IF_LINT (= NULL);
- ptrdiff_t ident_length = 0;
- fputs ("(fn", stdout);
- if (*buf == '(')
- ++buf;
- for (p = buf; *p; p++)
- {
- char c = *p;
- /* Notice when a new identifier starts. */
- if ((('A' <= c && c <= 'Z')
- || ('a' <= c && c <= 'z')
- || ('0' <= c && c <= '9')
- || c == '_')
- != in_ident)
- {
- if (!in_ident)
- {
- in_ident = true;
- ident_start = p;
- }
- else
- {
- in_ident = false;
- ident_length = p - ident_start;
- }
- }
- /* Found the end of an argument, write out the last seen
- identifier. */
- if (c == ',' || c == ')')
- {
- if (ident_length == 0)
- {
- error ("empty arg list for '%s' should be (void), not ()", func);
- continue;
- }
- if (strncmp (ident_start, "void", ident_length) == 0)
- continue;
- putchar (' ');
- if (minargs == 0 && maxargs > 0)
- fputs ("&optional ", stdout);
- minargs--;
- maxargs--;
- /* In C code, `default' is a reserved word, so we spell it
- `defalt'; demangle that here. */
- if (ident_length == 6 && memcmp (ident_start, "defalt", 6) == 0)
- fputs ("DEFAULT", stdout);
- else
- while (ident_length-- > 0)
- {
- c = *ident_start++;
- if (c >= 'a' && c <= 'z')
- /* Upcase the letter. */
- c += 'A' - 'a';
- else if (c == '_')
- /* Print underscore as hyphen. */
- c = '-';
- putchar (c);
- }
- }
- }
- putchar (')');
- }
- /* The types of globals. These are sorted roughly in decreasing alignment
- order to avoid allocation gaps, except that symbols and functions
- are last. */
- enum global_type
- {
- INVALID,
- LISP_OBJECT,
- EMACS_INTEGER,
- BOOLEAN,
- SYMBOL,
- FUNCTION
- };
- /* A single global. */
- struct global
- {
- enum global_type type;
- char *name;
- int flags;
- union
- {
- int value;
- char const *svalue;
- } v;
- };
- /* Bit values for FLAGS field from the above. Applied for DEFUNs only. */
- enum { DEFUN_noreturn = 1, DEFUN_const = 2 };
- /* All the variable names we saw while scanning C sources in `-g'
- mode. */
- static ptrdiff_t num_globals;
- static ptrdiff_t num_globals_allocated;
- static struct global *globals;
- static struct global *
- add_global (enum global_type type, char const *name, int value,
- char const *svalue)
- {
- /* Ignore the one non-symbol that can occur. */
- if (strcmp (name, "..."))
- {
- if (num_globals == num_globals_allocated)
- {
- ptrdiff_t num_globals_max = (min (PTRDIFF_MAX, SIZE_MAX)
- / sizeof *globals);
- if (num_globals_allocated == num_globals_max)
- memory_exhausted ();
- if (num_globals_allocated < num_globals_max / 2)
- num_globals_allocated = 2 * num_globals_allocated + 1;
- else
- num_globals_allocated = num_globals_max;
- globals = xrealloc (globals, num_globals_allocated * sizeof *globals);
- }
- ++num_globals;
- ptrdiff_t namesize = strlen (name) + 1;
- char *buf = xmalloc (namesize + (svalue ? strlen (svalue) + 1 : 0));
- globals[num_globals - 1].type = type;
- globals[num_globals - 1].name = strcpy (buf, name);
- if (svalue)
- globals[num_globals - 1].v.svalue = strcpy (buf + namesize, svalue);
- else
- globals[num_globals - 1].v.value = value;
- globals[num_globals - 1].flags = 0;
- return globals + num_globals - 1;
- }
- return NULL;
- }
- static int
- compare_globals (const void *a, const void *b)
- {
- const struct global *ga = a;
- const struct global *gb = b;
- if (ga->type != gb->type)
- return ga->type - gb->type;
- /* Consider "nil" to be the least, so that iQnil is zero. That
- way, Qnil's internal representation is zero, which is a bit faster. */
- if (ga->type == SYMBOL)
- {
- bool a_nil = strcmp (ga->name, "Qnil") == 0;
- bool b_nil = strcmp (gb->name, "Qnil") == 0;
- if (a_nil | b_nil)
- return b_nil - a_nil;
- }
- return strcmp (ga->name, gb->name);
- }
- static void
- close_emacs_globals (ptrdiff_t num_symbols)
- {
- printf (("};\n"
- "extern struct emacs_globals globals;\n"
- "\n"
- "#ifndef DEFINE_SYMBOLS\n"
- "extern\n"
- "#endif\n"
- "struct Lisp_Symbol alignas (GCALIGNMENT) lispsym[%td];\n"),
- num_symbols);
- }
- static void
- write_globals (void)
- {
- ptrdiff_t i, j;
- bool seen_defun = false;
- ptrdiff_t symnum = 0;
- ptrdiff_t num_symbols = 0;
- qsort (globals, num_globals, sizeof (struct global), compare_globals);
- j = 0;
- for (i = 0; i < num_globals; i++)
- {
- while (i + 1 < num_globals
- && strcmp (globals[i].name, globals[i + 1].name) == 0)
- {
- if (globals[i].type == FUNCTION
- && globals[i].v.value != globals[i + 1].v.value)
- error ("function '%s' defined twice with differing signatures",
- globals[i].name);
- free (globals[i].name);
- i++;
- }
- num_symbols += globals[i].type == SYMBOL;
- globals[j++] = globals[i];
- }
- num_globals = j;
- for (i = 0; i < num_globals; ++i)
- {
- char const *type = 0;
- switch (globals[i].type)
- {
- case EMACS_INTEGER:
- type = "EMACS_INT";
- break;
- case BOOLEAN:
- type = "bool";
- break;
- case LISP_OBJECT:
- type = "Lisp_Object";
- break;
- case SYMBOL:
- case FUNCTION:
- if (!seen_defun)
- {
- close_emacs_globals (num_symbols);
- putchar ('\n');
- seen_defun = true;
- }
- break;
- default:
- fatal ("not a recognized DEFVAR_");
- }
- if (type)
- {
- printf (" %s f_%s;\n", type, globals[i].name);
- printf ("#define %s globals.f_%s\n",
- globals[i].name, globals[i].name);
- }
- else if (globals[i].type == SYMBOL)
- printf (("#define i%s %td\n"
- "DEFINE_LISP_SYMBOL (%s)\n"),
- globals[i].name, symnum++, globals[i].name);
- else
- {
- if (globals[i].flags & DEFUN_noreturn)
- fputs ("_Noreturn ", stdout);
- printf ("EXFUN (%s, ", globals[i].name);
- if (globals[i].v.value == -1)
- fputs ("MANY", stdout);
- else if (globals[i].v.value == -2)
- fputs ("UNEVALLED", stdout);
- else
- printf ("%d", globals[i].v.value);
- putchar (')');
- if (globals[i].flags & DEFUN_const)
- fputs (" ATTRIBUTE_CONST", stdout);
- puts (";");
- }
- }
- if (!seen_defun)
- close_emacs_globals (num_symbols);
- puts ("#ifdef DEFINE_SYMBOLS");
- puts ("static char const *const defsym_name[] = {");
- for (ptrdiff_t i = 0; i < num_globals; i++)
- if (globals[i].type == SYMBOL)
- printf ("\t\"%s\",\n", globals[i].v.svalue);
- puts ("};");
- puts ("#endif");
- puts ("#define Qnil builtin_lisp_symbol (0)");
- puts ("#if DEFINE_NON_NIL_Q_SYMBOL_MACROS");
- num_symbols = 0;
- for (ptrdiff_t i = 0; i < num_globals; i++)
- if (globals[i].type == SYMBOL && num_symbols++ != 0)
- printf ("# define %s builtin_lisp_symbol (%td)\n",
- globals[i].name, num_symbols - 1);
- puts ("#endif");
- }
- /* Read through a c file. If a .o file is named,
- the corresponding .c or .m file is read instead.
- Looks for DEFUN constructs such as are defined in ../src/lisp.h.
- Accepts any word starting DEF... so it finds DEFSIMPLE and DEFPRED. */
- static void
- scan_c_file (char *filename, const char *mode)
- {
- FILE *infile;
- char extension = filename[strlen (filename) - 1];
- if (extension == 'o')
- filename[strlen (filename) - 1] = 'c';
- infile = fopen (filename, mode);
- if (infile == NULL && extension == 'o')
- {
- /* Try .m. */
- filename[strlen (filename) - 1] = 'm';
- infile = fopen (filename, mode);
- if (infile == NULL)
- filename[strlen (filename) - 1] = 'c'; /* Don't confuse people. */
- }
- if (infile == NULL)
- {
- perror (filename);
- exit (EXIT_FAILURE);
- }
- /* Reset extension to be able to detect duplicate files. */
- filename[strlen (filename) - 1] = extension;
- scan_c_stream (infile);
- }
- /* Return 1 if next input from INFILE is equal to P, -1 if EOF,
- 0 if input doesn't match. */
- static int
- stream_match (FILE *infile, const char *p)
- {
- for (; *p; p++)
- {
- int c = getc (infile);
- if (c == EOF)
- return -1;
- if (c != *p)
- return 0;
- }
- return 1;
- }
- static void
- scan_c_stream (FILE *infile)
- {
- int commas, minargs, maxargs;
- int c = '\n';
- while (!feof (infile))
- {
- bool doc_keyword = false;
- bool defunflag = false;
- bool defvarperbufferflag = false;
- bool defvarflag = false;
- enum global_type type = INVALID;
- static char *name;
- static ptrdiff_t name_size;
- if (c != '\n' && c != '\r')
- {
- c = getc (infile);
- continue;
- }
- c = getc (infile);
- if (c == ' ')
- {
- while (c == ' ')
- c = getc (infile);
- if (c != 'D')
- continue;
- c = getc (infile);
- if (c != 'E')
- continue;
- c = getc (infile);
- if (c != 'F')
- continue;
- c = getc (infile);
- if (c == 'S')
- {
- c = getc (infile);
- if (c != 'Y')
- continue;
- c = getc (infile);
- if (c != 'M')
- continue;
- c = getc (infile);
- if (c != ' ' && c != '\t' && c != '(')
- continue;
- type = SYMBOL;
- }
- else if (c == 'V')
- {
- c = getc (infile);
- if (c != 'A')
- continue;
- c = getc (infile);
- if (c != 'R')
- continue;
- c = getc (infile);
- if (c != '_')
- continue;
- defvarflag = true;
- c = getc (infile);
- defvarperbufferflag = (c == 'P');
- if (generate_globals)
- {
- if (c == 'I')
- type = EMACS_INTEGER;
- else if (c == 'L')
- type = LISP_OBJECT;
- else if (c == 'B')
- type = BOOLEAN;
- }
- c = getc (infile);
- /* We need to distinguish between DEFVAR_BOOL and
- DEFVAR_BUFFER_DEFAULTS. */
- if (generate_globals && type == BOOLEAN && c != 'O')
- type = INVALID;
- }
- else
- continue;
- }
- else if (c == 'D')
- {
- c = getc (infile);
- if (c != 'E')
- continue;
- c = getc (infile);
- if (c != 'F')
- continue;
- c = getc (infile);
- defunflag = c == 'U';
- }
- else continue;
- if (generate_globals
- && (!defvarflag || defvarperbufferflag || type == INVALID)
- && !defunflag && type != SYMBOL)
- continue;
- while (c != '(')
- {
- if (c < 0)
- goto eof;
- c = getc (infile);
- }
- if (type != SYMBOL)
- {
- /* Lisp variable or function name. */
- c = getc (infile);
- if (c != '"')
- continue;
- c = read_c_string_or_comment (infile, -1, false, 0);
- }
- if (generate_globals)
- {
- ptrdiff_t i = 0;
- char const *svalue = 0;
- /* Skip "," and whitespace. */
- do
- {
- c = getc (infile);
- }
- while (c == ',' || c == ' ' || c == '\t' || c == '\n' || c == '\r');
- /* Read in the identifier. */
- do
- {
- if (c < 0)
- goto eof;
- input_buffer[i++] = c;
- c = getc (infile);
- }
- while (! (c == ',' || c == ' ' || c == '\t'
- || c == '\n' || c == '\r'));
- input_buffer[i] = '\0';
- if (name_size <= i)
- {
- free (name);
- name_size = i + 1;
- ptrdiff_t doubled;
- if (! INT_MULTIPLY_WRAPV (name_size, 2, &doubled)
- && doubled <= SIZE_MAX)
- name_size = doubled;
- name = xmalloc (name_size);
- }
- memcpy (name, input_buffer, i + 1);
- if (type == SYMBOL)
- {
- do
- c = getc (infile);
- while (c == ' ' || c == '\t' || c == '\n' || c == '\r');
- if (c != '"')
- continue;
- c = read_c_string_or_comment (infile, -1, false, 0);
- svalue = input_buffer;
- }
- if (!defunflag)
- {
- add_global (type, name, 0, svalue);
- continue;
- }
- }
- if (type == SYMBOL)
- continue;
- /* DEFVAR_LISP ("name", addr, "doc")
- DEFVAR_LISP ("name", addr /\* doc *\/)
- DEFVAR_LISP ("name", addr, doc: /\* doc *\/) */
- if (defunflag)
- commas = generate_globals ? 4 : 5;
- else if (defvarperbufferflag)
- commas = 3;
- else if (defvarflag)
- commas = 1;
- else /* For DEFSIMPLE and DEFPRED. */
- commas = 2;
- while (commas)
- {
- if (c == ',')
- {
- commas--;
- if (defunflag && (commas == 1 || commas == 2))
- {
- int scanned = 0;
- do
- c = getc (infile);
- while (c == ' ' || c == '\n' || c == '\r' || c == '\t');
- if (c < 0)
- goto eof;
- ungetc (c, infile);
- if (commas == 2) /* Pick up minargs. */
- scanned = fscanf (infile, "%d", &minargs);
- else /* Pick up maxargs. */
- if (c == 'M' || c == 'U') /* MANY || UNEVALLED */
- {
- if (generate_globals)
- maxargs = (c == 'M') ? -1 : -2;
- else
- maxargs = -1;
- }
- else
- scanned = fscanf (infile, "%d", &maxargs);
- if (scanned < 0)
- goto eof;
- }
- }
- if (c == EOF)
- goto eof;
- c = getc (infile);
- }
- if (generate_globals)
- {
- struct global *g = add_global (FUNCTION, name, maxargs, 0);
- if (!g)
- continue;
- /* The following code tries to recognize function attributes
- specified after the docstring, e.g.:
- DEFUN ("foo", Ffoo, Sfoo, X, Y, Z,
- doc: /\* doc *\/
- attributes: attribute1 attribute2 ...)
- (Lisp_Object arg...)
- Now only 'noreturn' and 'const' attributes are used. */
- /* Advance to the end of docstring. */
- c = getc (infile);
- if (c == EOF)
- goto eof;
- int d = getc (infile);
- if (d == EOF)
- goto eof;
- while (1)
- {
- if (c == '*' && d == '/')
- break;
- c = d, d = getc (infile);
- if (d == EOF)
- goto eof;
- }
- /* Skip spaces, if any. */
- do
- {
- c = getc (infile);
- if (c == EOF)
- goto eof;
- }
- while (c == ' ' || c == '\n' || c == '\r' || c == '\t');
- /* Check for 'attributes:' token. */
- if (c == 'a' && stream_match (infile, "ttributes:"))
- {
- char *p = input_buffer;
- /* Collect attributes up to ')'. */
- while (1)
- {
- c = getc (infile);
- if (c == EOF)
- goto eof;
- if (c == ')')
- break;
- if (p - input_buffer > sizeof (input_buffer))
- abort ();
- *p++ = c;
- }
- *p = 0;
- if (strstr (input_buffer, "noreturn"))
- g->flags |= DEFUN_noreturn;
- if (strstr (input_buffer, "const"))
- g->flags |= DEFUN_const;
- }
- continue;
- }
- while (c == ' ' || c == '\n' || c == '\r' || c == '\t')
- c = getc (infile);
- if (c == '"')
- c = read_c_string_or_comment (infile, 0, false, 0);
- while (c != EOF && c != ',' && c != '/')
- c = getc (infile);
- if (c == ',')
- {
- c = getc (infile);
- while (c == ' ' || c == '\n' || c == '\r' || c == '\t')
- c = getc (infile);
- while ((c >= 'a' && c <= 'z') || (c >= 'Z' && c <= 'Z'))
- c = getc (infile);
- if (c == ':')
- {
- doc_keyword = true;
- c = getc (infile);
- while (c == ' ' || c == '\n' || c == '\r' || c == '\t')
- c = getc (infile);
- }
- }
- if (c == '"'
- || (c == '/'
- && (c = getc (infile),
- ungetc (c, infile),
- c == '*')))
- {
- bool comment = c != '"';
- bool saw_usage;
- printf ("\037%c%s\n", defvarflag ? 'V' : 'F', input_buffer);
- if (comment)
- getc (infile); /* Skip past `*'. */
- c = read_c_string_or_comment (infile, 1, comment, &saw_usage);
- /* If this is a defun, find the arguments and print them. If
- this function takes MANY or UNEVALLED args, then the C source
- won't give the names of the arguments, so we shouldn't bother
- trying to find them.
- Various doc-string styles:
- 0: DEFUN (..., "DOC") (args) [!comment]
- 1: DEFUN (..., /\* DOC *\/ (args)) [comment && !doc_keyword]
- 2: DEFUN (..., doc: /\* DOC *\/) (args) [comment && doc_keyword]
- */
- if (defunflag && maxargs != -1 && !saw_usage)
- {
- char argbuf[1024], *p = argbuf;
- if (!comment || doc_keyword)
- while (c != ')')
- {
- if (c < 0)
- goto eof;
- c = getc (infile);
- }
- /* Skip into arguments. */
- while (c != '(')
- {
- if (c < 0)
- goto eof;
- c = getc (infile);
- }
- /* Copy arguments into ARGBUF. */
- *p++ = c;
- do
- *p++ = c = getc (infile);
- while (c != ')');
- *p = '\0';
- /* Output them. */
- fputs ("\n\n", stdout);
- write_c_args (input_buffer, argbuf, minargs, maxargs);
- }
- else if (defunflag && maxargs == -1 && !saw_usage)
- /* The DOC should provide the usage form. */
- fprintf (stderr, "Missing 'usage' for function '%s'.\n",
- input_buffer);
- }
- }
- eof:
- if (ferror (infile) || fclose (infile) != 0)
- fatal ("read error");
- }
- /* Read a file of Lisp code, compiled or interpreted.
- Looks for
- (defun NAME ARGS DOCSTRING ...)
- (defmacro NAME ARGS DOCSTRING ...)
- (defsubst NAME ARGS DOCSTRING ...)
- (autoload (quote NAME) FILE DOCSTRING ...)
- (defvar NAME VALUE DOCSTRING)
- (defconst NAME VALUE DOCSTRING)
- (fset (quote NAME) (make-byte-code ... DOCSTRING ...))
- (fset (quote NAME) #[... DOCSTRING ...])
- (defalias (quote NAME) #[... DOCSTRING ...])
- (custom-declare-variable (quote NAME) VALUE DOCSTRING ...)
- starting in column zero.
- (quote NAME) may appear as 'NAME as well.
- We also look for #@LENGTH CONTENTS^_ at the beginning of the line.
- When we find that, we save it for the following defining-form,
- and we use that instead of reading a doc string within that defining-form.
- For defvar, defconst, and fset we skip to the docstring with a kludgy
- formatting convention: all docstrings must appear on the same line as the
- initial open-paren (the one in column zero) and must contain a backslash
- and a newline immediately after the initial double-quote. No newlines
- must appear between the beginning of the form and the first double-quote.
- For defun, defmacro, and autoload, we know how to skip over the
- arglist, but the doc string must still have a backslash and newline
- immediately after the double quote.
- The only source files that must follow this convention are preloaded
- uncompiled ones like loaddefs.el; aside from that, it is always the .elc
- file that we should look at, and they are no problem because byte-compiler
- output follows this convention.
- The NAME and DOCSTRING are output.
- NAME is preceded by `F' for a function or `V' for a variable.
- An entry is output only if DOCSTRING has \ newline just after the opening ".
- */
- static void
- skip_white (FILE *infile)
- {
- char c = ' ';
- while (c == ' ' || c == '\t' || c == '\n' || c == '\r')
- c = getc (infile);
- ungetc (c, infile);
- }
- static void
- read_lisp_symbol (FILE *infile, char *buffer)
- {
- char c;
- char *fillp = buffer;
- skip_white (infile);
- while (1)
- {
- c = getc (infile);
- if (c == '\\')
- *(++fillp) = getc (infile);
- else if (c == ' ' || c == '\t' || c == '\n' || c == '\r' || c == '(' || c == ')')
- {
- ungetc (c, infile);
- *fillp = 0;
- break;
- }
- else
- *fillp++ = c;
- }
- if (! buffer[0])
- fprintf (stderr, "## expected a symbol, got '%c'\n", c);
- skip_white (infile);
- }
- static bool
- search_lisp_doc_at_eol (FILE *infile)
- {
- int c = 0, c1 = 0, c2 = 0;
- /* Skip until the end of line; remember two previous chars. */
- while (c != '\n' && c != '\r' && c != EOF)
- {
- c2 = c1;
- c1 = c;
- c = getc (infile);
- }
- /* If two previous characters were " and \,
- this is a doc string. Otherwise, there is none. */
- if (c2 != '"' || c1 != '\\')
- {
- #ifdef DEBUG
- fprintf (stderr, "## non-docstring found\n");
- #endif
- ungetc (c, infile);
- return false;
- }
- return true;
- }
- #define DEF_ELISP_FILE(fn) { #fn, sizeof(#fn) - 1 }
- static void
- scan_lisp_file (const char *filename, const char *mode)
- {
- FILE *infile;
- int c;
- char *saved_string = 0;
- /* These are the only files that are loaded uncompiled, and must
- follow the conventions of the doc strings expected by this
- function. These conventions are automatically followed by the
- byte compiler when it produces the .elc files. */
- static struct {
- const char *fn;
- int fl;
- } const uncompiled[] = {
- DEF_ELISP_FILE (loaddefs.el),
- DEF_ELISP_FILE (loadup.el),
- DEF_ELISP_FILE (charprop.el),
- DEF_ELISP_FILE (cp51932.el),
- DEF_ELISP_FILE (eucjp-ms.el)
- };
- int i;
- int flen = strlen (filename);
- if (generate_globals)
- fatal ("scanning lisp file when -g specified");
- if (flen > 3 && !strcmp (filename + flen - 3, ".el"))
- {
- bool match = false;
- for (i = 0; i < sizeof (uncompiled) / sizeof (uncompiled[0]); i++)
- {
- if (uncompiled[i].fl <= flen
- && !strcmp (filename + flen - uncompiled[i].fl, uncompiled[i].fn)
- && (flen == uncompiled[i].fl
- || IS_SLASH (filename[flen - uncompiled[i].fl - 1])))
- {
- match = true;
- break;
- }
- }
- if (!match)
- fatal ("uncompiled lisp file %s is not supported", filename);
- }
- infile = fopen (filename, mode);
- if (infile == NULL)
- {
- perror (filename);
- exit (EXIT_FAILURE);
- }
- c = '\n';
- while (!feof (infile))
- {
- char buffer[BUFSIZ];
- char type;
- /* If not at end of line, skip till we get to one. */
- if (c != '\n' && c != '\r')
- {
- c = getc (infile);
- continue;
- }
- /* Skip the line break. */
- while (c == '\n' || c == '\r')
- c = getc (infile);
- /* Detect a dynamic doc string and save it for the next expression. */
- if (c == '#')
- {
- c = getc (infile);
- if (c == '@')
- {
- ptrdiff_t length = 0;
- ptrdiff_t i;
- /* Read the length. */
- while ((c = getc (infile),
- c >= '0' && c <= '9'))
- {
- if (INT_MULTIPLY_WRAPV (length, 10, &length)
- || INT_ADD_WRAPV (length, c - '0', &length)
- || SIZE_MAX < length)
- memory_exhausted ();
- }
- if (length <= 1)
- fatal ("invalid dynamic doc string length");
- if (c != ' ')
- fatal ("space not found after dynamic doc string length");
- /* The next character is a space that is counted in the length
- but not part of the doc string.
- We already read it, so just ignore it. */
- length--;
- /* Read in the contents. */
- free (saved_string);
- saved_string = xmalloc (length);
- for (i = 0; i < length; i++)
- saved_string[i] = getc (infile);
- /* The last character is a ^_.
- That is needed in the .elc file
- but it is redundant in DOC. So get rid of it here. */
- saved_string[length - 1] = 0;
- /* Skip the line break. */
- while (c == '\n' || c == '\r')
- c = getc (infile);
- /* Skip the following line. */
- while (c != '\n' && c != '\r')
- c = getc (infile);
- }
- continue;
- }
- if (c != '(')
- continue;
- read_lisp_symbol (infile, buffer);
- if (! strcmp (buffer, "defun")
- || ! strcmp (buffer, "defmacro")
- || ! strcmp (buffer, "defsubst"))
- {
- type = 'F';
- read_lisp_symbol (infile, buffer);
- /* Skip the arguments: either "nil" or a list in parens. */
- c = getc (infile);
- if (c == 'n') /* nil */
- {
- if ((c = getc (infile)) != 'i'
- || (c = getc (infile)) != 'l')
- {
- fprintf (stderr, "## unparsable arglist in %s (%s)\n",
- buffer, filename);
- continue;
- }
- }
- else if (c != '(')
- {
- fprintf (stderr, "## unparsable arglist in %s (%s)\n",
- buffer, filename);
- continue;
- }
- else
- while (c != ')')
- c = getc (infile);
- skip_white (infile);
- /* If the next three characters aren't `dquote bslash newline'
- then we're not reading a docstring.
- */
- if ((c = getc (infile)) != '"'
- || (c = getc (infile)) != '\\'
- || ((c = getc (infile)) != '\n' && c != '\r'))
- {
- #ifdef DEBUG
- fprintf (stderr, "## non-docstring in %s (%s)\n",
- buffer, filename);
- #endif
- continue;
- }
- }
- /* defcustom can only occur in uncompiled Lisp files. */
- else if (! strcmp (buffer, "defvar")
- || ! strcmp (buffer, "defconst")
- || ! strcmp (buffer, "defcustom"))
- {
- type = 'V';
- read_lisp_symbol (infile, buffer);
- if (saved_string == 0)
- if (!search_lisp_doc_at_eol (infile))
- continue;
- }
- else if (! strcmp (buffer, "custom-declare-variable")
- || ! strcmp (buffer, "defvaralias")
- )
- {
- type = 'V';
- c = getc (infile);
- if (c == '\'')
- read_lisp_symbol (infile, buffer);
- else
- {
- if (c != '(')
- {
- fprintf (stderr,
- "## unparsable name in custom-declare-variable in %s\n",
- filename);
- continue;
- }
- read_lisp_symbol (infile, buffer);
- if (strcmp (buffer, "quote"))
- {
- fprintf (stderr,
- "## unparsable name in custom-declare-variable in %s\n",
- filename);
- continue;
- }
- read_lisp_symbol (infile, buffer);
- c = getc (infile);
- if (c != ')')
- {
- fprintf (stderr,
- "## unparsable quoted name in custom-declare-variable in %s\n",
- filename);
- continue;
- }
- }
- if (saved_string == 0)
- if (!search_lisp_doc_at_eol (infile))
- continue;
- }
- else if (! strcmp (buffer, "fset") || ! strcmp (buffer, "defalias"))
- {
- type = 'F';
- c = getc (infile);
- if (c == '\'')
- read_lisp_symbol (infile, buffer);
- else
- {
- if (c != '(')
- {
- fprintf (stderr, "## unparsable name in fset in %s\n",
- filename);
- continue;
- }
- read_lisp_symbol (infile, buffer);
- if (strcmp (buffer, "quote"))
- {
- fprintf (stderr, "## unparsable name in fset in %s\n",
- filename);
- continue;
- }
- read_lisp_symbol (infile, buffer);
- c = getc (infile);
- if (c != ')')
- {
- fprintf (stderr,
- "## unparsable quoted name in fset in %s\n",
- filename);
- continue;
- }
- }
- if (saved_string == 0)
- if (!search_lisp_doc_at_eol (infile))
- continue;
- }
- else if (! strcmp (buffer, "autoload"))
- {
- type = 'F';
- c = getc (infile);
- if (c == '\'')
- read_lisp_symbol (infile, buffer);
- else
- {
- if (c != '(')
- {
- fprintf (stderr, "## unparsable name in autoload in %s\n",
- filename);
- continue;
- }
- read_lisp_symbol (infile, buffer);
- if (strcmp (buffer, "quote"))
- {
- fprintf (stderr, "## unparsable name in autoload in %s\n",
- filename);
- continue;
- }
- read_lisp_symbol (infile, buffer);
- c = getc (infile);
- if (c != ')')
- {
- fprintf (stderr,
- "## unparsable quoted name in autoload in %s\n",
- filename);
- continue;
- }
- }
- skip_white (infile);
- if ((c = getc (infile)) != '\"')
- {
- fprintf (stderr, "## autoload of %s unparsable (%s)\n",
- buffer, filename);
- continue;
- }
- read_c_string_or_comment (infile, 0, false, 0);
- if (saved_string == 0)
- if (!search_lisp_doc_at_eol (infile))
- continue;
- }
- #ifdef DEBUG
- else if (! strcmp (buffer, "if")
- || ! strcmp (buffer, "byte-code"))
- continue;
- #endif
- else
- {
- #ifdef DEBUG
- fprintf (stderr, "## unrecognized top-level form, %s (%s)\n",
- buffer, filename);
- #endif
- continue;
- }
- /* At this point, we should either use the previous dynamic doc string in
- saved_string or gobble a doc string from the input file.
- In the latter case, the opening quote (and leading backslash-newline)
- have already been read. */
- printf ("\037%c%s\n", type, buffer);
- if (saved_string)
- {
- fputs (saved_string, stdout);
- /* Don't use one dynamic doc string twice. */
- free (saved_string);
- saved_string = 0;
- }
- else
- read_c_string_or_comment (infile, 1, false, 0);
- }
- free (saved_string);
- if (ferror (infile) || fclose (infile) != 0)
- fatal ("%s: read error", filename);
- }
- /* make-docfile.c ends here */
|