12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794 |
- /* Copyright (C) 1995,1996,1997, 1999, 2000, 2002 Free Software Foundation, Inc.
- *
- * This program is free software; you can redistribute it and/or modify
- * it under the terms of the GNU General Public License as published by
- * the Free Software Foundation; either version 2, or (at your option)
- * any later version.
- *
- * This program is distributed in the hope that it will be useful,
- * but WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- * GNU General Public License for more details.
- *
- * You should have received a copy of the GNU General Public License
- * along with this software; see the file COPYING. If not, write to
- * the Free Software Foundation, Inc., 59 Temple Place, Suite 330,
- * Boston, MA 02111-1307 USA
- *
- * As a special exception, the Free Software Foundation gives permission
- * for additional uses of the text contained in its release of GUILE.
- *
- * The exception is that, if you link the GUILE library with other files
- * to produce an executable, this does not by itself cause the
- * resulting executable to be covered by the GNU General Public License.
- * Your use of that executable is in no way restricted on account of
- * linking the GUILE library code into it.
- *
- * This exception does not however invalidate any other reasons why
- * the executable file might be covered by the GNU General Public License.
- *
- * This exception applies only to the code released by the
- * Free Software Foundation under the name GUILE. If you copy
- * code from other Free Software Foundation releases into a copy of
- * GUILE, as the General Public License permits, the exception does
- * not apply to the code that you add in this way. To avoid misleading
- * anyone as to the status of such modified files, you must delete
- * this exception notice from them.
- *
- * If you write modifications of your own for GUILE, it is your choice
- * whether to permit this exception to apply to your modifications.
- * If you do not wish that, delete this exception notice. */
- #include <stdio.h>
- #include "libguile/_scm.h"
- #include "libguile/chars.h"
- #include "libguile/eval.h"
- #include "libguile/unif.h"
- #include "libguile/keywords.h"
- #include "libguile/alist.h"
- #include "libguile/srcprop.h"
- #include "libguile/hashtab.h"
- #include "libguile/hash.h"
- #include "libguile/ports.h"
- #include "libguile/root.h"
- #include "libguile/strings.h"
- #include "libguile/vectors.h"
- #include "libguile/validate.h"
- #include "libguile/read.h"
/* The symbol scm_lreadr compares the "keywords" option against when it
   meets a leading `:' (see the SCM_KEYWORD_STYLE test there).
   NOTE(review): presumably SCM_SYMBOL defines the C variable and binds
   it to the symbol named "prefix" -- confirm against the snarf macros.  */
- SCM_SYMBOL (scm_keyword_prefix, "prefix");
/* Reader option table.  It is handed to scm_options by
   read-options-interface and to scm_init_opts by scm_init_read, both
   together with SCM_N_READ_OPTIONS.
   NOTE(review): the SCM_COPY_SOURCE_P / SCM_RECORD_POSITIONS_P /
   SCM_CASE_INSENSITIVE_P / SCM_KEYWORD_STYLE accessors used in this
   file presumably index this table by position, so the order of the
   entries would matter -- confirm in read.h before reordering.  */
- scm_option scm_read_opts[] = {
- { SCM_OPTION_BOOLEAN, "copy", 0,
- "Copy source code expressions." },
- { SCM_OPTION_BOOLEAN, "positions", 0,
- "Record positions of source code expressions." },
- { SCM_OPTION_BOOLEAN, "case-insensitive", 0,
- "Convert symbols to lower case."},
/* The only non-boolean entry: it holds a Scheme value, initially #f.  */
- { SCM_OPTION_SCM, "keywords", SCM_UNPACK (SCM_BOOL_F),
- "Style of keyword recognition: #f or 'prefix"}
- };
- SCM_DEFINE (scm_read_options, "read-options-interface", 0, 1, 0,
- (SCM setting),
- "")
- #define FUNC_NAME s_scm_read_options
- {
- SCM ans = scm_options (setting,
- scm_read_opts,
- SCM_N_READ_OPTIONS,
- FUNC_NAME);
- if (SCM_COPY_SOURCE_P)
- SCM_RECORD_POSITIONS_P = 1;
- return ans;
- }
- #undef FUNC_NAME
- /* An association list mapping extra hash characters to procedures.
-    This is a pointer to the location holding the alist; scm_init_read
-    sets it to the CDR location of the cell that scm_sysintern returns
-    for "read-hash-procedures".  Entries are (CHAR . PROC) pairs:
-    scm_read_hash_extend edits the list and scm_get_hash_procedure
-    searches it.  */
- static SCM *scm_read_hash_procedures;
- SCM_DEFINE (scm_read, "read", 0, 1, 0,
- (SCM port),
- "")
- #define FUNC_NAME s_scm_read
- {
- int c;
- SCM tok_buf, copy;
- if (SCM_UNBNDP (port))
- port = scm_cur_inp;
- SCM_VALIDATE_OPINPORT (1,port);
- c = scm_flush_ws (port, (char *) NULL);
- if (EOF == c)
- return SCM_EOF_VAL;
- scm_ungetc (c, port);
- tok_buf = scm_makstr (30L, 0);
- return scm_lreadr (&tok_buf, port, ©);
- }
- #undef FUNC_NAME
- char *
- scm_grow_tok_buf (SCM *tok_buf)
- {
- scm_vector_set_length_x (*tok_buf, SCM_MAKINUM (2 * SCM_LENGTH (*tok_buf)));
- return SCM_CHARS (*tok_buf);
- }
- int
- scm_flush_ws (SCM port, const char *eoferr)
- {
- register int c;
- while (1)
- switch (c = scm_getc (port))
- {
- case EOF:
- goteof:
- if (eoferr)
- scm_wta (SCM_UNDEFINED, "end of file in ", eoferr);
- return c;
- case ';':
- lp:
- switch (c = scm_getc (port))
- {
- case EOF:
- goto goteof;
- default:
- goto lp;
- case SCM_LINE_INCREMENTORS:
- break;
- }
- break;
- case SCM_LINE_INCREMENTORS:
- case SCM_SINGLE_SPACES:
- case '\t':
- break;
- default:
- return c;
- }
- }
/* Compare the NUL-terminated strings S1 and S2, treating characters
   as equal when scm_downcase maps them to the same value.  Returns 1
   when the strings match over their whole length and 0 otherwise.  */
int
scm_casei_streq (char *s1, char *s2)
{
  for (; *s1 != '\0' && *s2 != '\0'; ++s1, ++s2)
    {
      if (scm_downcase ((int) *s1) != scm_downcase ((int) *s2))
        return 0;
    }

  /* Equal only if both strings ended at the same position.  */
  return *s1 == '\0' && *s2 == '\0';
}
/* recsexpr is used when recording expressions
 * constructed by read:sharp.
 *
 * Without DEBUG_EXTENSIONS it is a no-op that evaluates to OBJ.
 * Otherwise it walks the spine of OBJ, recursing into each car, and
 * gives every pair that has no entry in scm_source_whash yet a source
 * property record built from LINE, COLUMN and FILENAME.  OBJ itself is
 * always returned unchanged.
 */
#ifndef DEBUG_EXTENSIONS
#define recsexpr(obj, line, column, filename) (obj)
#else
static SCM
recsexpr (SCM obj,int line,int column,SCM filename)
{
  SCM tmp = obj;
  SCM copy;

  if (!SCM_CONSP (obj))
    return obj;

  /* If this sexpr is visible in the read:sharp source, we want to
     keep that information, so only record non-constant cons cells
     which haven't previously been read by the reader. */
  if (!SCM_FALSEP (scm_whash_lookup (scm_source_whash, obj)))
    return obj;

  if (SCM_COPY_SOURCE_P)
    {
      /* Build a fresh spine for the copy.  COPY stays on the first
         cell so the whole copy is what gets recorded below; TAIL is
         the cursor used to append.  (Advancing COPY itself would leave
         only the last cell of the copy in the source properties.)  */
      SCM tail;

      copy = tail = scm_cons (recsexpr (SCM_CAR (obj), line, column,
                                        filename),
                              SCM_UNDEFINED);
      while ((tmp = SCM_CDR (tmp)) && SCM_CONSP (tmp))
        {
          SCM_SETCDR (tail, scm_cons (recsexpr (SCM_CAR (tmp),
                                                line,
                                                column,
                                                filename),
                                      SCM_UNDEFINED));
          tail = SCM_CDR (tail);
        }
      /* Terminate the copy with the original's final cdr, which is
         whatever non-pair value stopped the loop.  */
      SCM_SETCDR (tail, tmp);
    }
  else
    {
      /* No copy wanted: just visit the elements so nested pairs get
         their own records.  */
      recsexpr (SCM_CAR (obj), line, column, filename);
      while ((tmp = SCM_CDR (tmp)) && SCM_CONSP (tmp))
        recsexpr (SCM_CAR (tmp), line, column, filename);
      copy = SCM_UNDEFINED;
    }

  scm_whash_insert (scm_source_whash,
                    obj,
                    scm_make_srcprops (line,
                                       column,
                                       filename,
                                       copy,
                                       SCM_EOL));
  return obj;
}
#endif
- /* Consume an SCSH-style block comment. Assume that we've already
- read the initial `#!', and eat characters until we get a
- newline/exclamation-point/sharp-sign/newline sequence. */
- static void
- skip_scsh_block_comment (SCM port)
- {
- /* Is this portable? Dear God, spare me from the non-eight-bit
- characters. But is it tasteful? */
- long history = 0;
- for (;;)
- {
- int c = scm_getc (port);
- if (c == EOF)
- scm_wta (SCM_UNDEFINED,
- "unterminated `#! ... !#' comment", "read");
- history = ((history << 8) | (c & 0xff)) & 0xffffffff;
- /* Were the last four characters read "\n!#\n"? */
- if (history == (('\n' << 24) | ('!' << 16) | ('#' << 8) | '\n'))
- return;
- }
- }
/* Forward declaration; the definition is further down in this file.  */
- static SCM scm_get_hash_procedure(int c);
/* Name handed to the list readers for a plain `(' list; they pass it
   on to scm_flush_ws as the end-of-file context.  */
- static char s_list[]="list";
/* Read one datum from PORT and return it.

   TOK_BUF points at the scratch string used to accumulate tokens and
   string literals; it is grown as needed.  COPY is an out-parameter:
   when source copying is enabled, the quote-form branch and the
   hash-procedure branch below store a value through it, and the list
   readers called from here receive it as well.

   The dispatch is on the first character after whitespace/comments.
   Errors are reported through scm_wta, scm_misc_error and SCM_ASSERT.
   NOTE(review): several branches are written as if those calls do not
   return (control would otherwise run on into the next case) --
   confirm that they are non-local exits.  */
- SCM
- scm_lreadr (SCM *tok_buf,SCM port,SCM *copy)
- {
- int c;
- scm_sizet j;
- SCM p;
- 
- tryagain:
/* A non-null context string is passed here, so scm_flush_ws itself
   reports end of file through scm_wta on this path.  */
- c = scm_flush_ws (port, s_scm_read);
- tryagain_no_flush_ws:
- switch (c)
- {
/* Reached with EOF from the `#!' branch below, which skips whitespace
   with a null context string.  */
- case EOF:
- return SCM_EOF_VAL;
/* List: use the position-recording reader when that option is on.  */
- case '(':
- return SCM_RECORD_POSITIONS_P
- ? scm_lreadrecparen (tok_buf, port, s_list, copy)
- : scm_lreadparen (tok_buf, port, s_list, copy);
- case ')':
- scm_wta (SCM_UNDEFINED, "unexpected \")\"", "read");
- goto tryagain;
- 
/* Quote-like prefixes: choose the wrapping symbol, then build
   (SYMBOL DATUM) at recquote.  */
- case '\'':
- p = scm_sym_quote;
- goto recquote;
- case '`':
- p = scm_sym_quasiquote;
- goto recquote;
- case ',':
/* `,@' is unquote-splicing; any other following character is pushed
   back and the form is a plain unquote.  */
- c = scm_getc (port);
- if ('@' == c)
- p = scm_sym_uq_splicing;
- else
- {
- scm_ungetc (c, port);
- p = scm_sym_unquote;
- }
- recquote:
- p = scm_cons2 (p,
- scm_lreadr (tok_buf, port, copy),
- SCM_EOL);
/* Record source properties for the new two-element list.  The port's
   line and column are sampled here, after the quoted datum has been
   read.  With source copying on, a fresh (SYMBOL DATUM) list is also
   stored through COPY and placed in the properties.  */
- if (SCM_RECORD_POSITIONS_P)
- scm_whash_insert (scm_source_whash,
- p,
- scm_make_srcprops (SCM_LINUM (port),
- SCM_COL (port) - 1,
- SCM_FILENAME (port),
- SCM_COPY_SOURCE_P
- ? (*copy = scm_cons2 (SCM_CAR (p),
- SCM_CAR (SCM_CDR (p)),
- SCM_EOL))
- : SCM_UNDEFINED,
- SCM_EOL));
- return p;
/* `#' syntax: dispatch on the character that follows.  */
- case '#':
- c = scm_getc (port);
- switch (c)
- {
/* #( ... ): read the elements as a list (always with the
   non-recording list reader) and convert it to a vector; an empty
   list yields scm_nullvect.  */
- case '(':
- p = scm_lreadparen (tok_buf, port, "vector", copy);
- return SCM_NULLP (p) ? scm_nullvect : scm_vector (p);
/* #t / #f in either case.  Only this one character is consumed.  */
- case 't':
- case 'T':
- return SCM_BOOL_T;
- case 'f':
- case 'F':
- return SCM_BOOL_F;
/* Numeric prefixes (#b #o #d #x #i #e): push the letter back and
   re-read the whole token, starting from `#', as a number.  */
- case 'b':
- case 'B':
- case 'o':
- case 'O':
- case 'd':
- case 'D':
- case 'x':
- case 'X':
- case 'i':
- case 'I':
- case 'e':
- case 'E':
- scm_ungetc (c, port);
- c = '#';
- goto num;
- case '!':
- /* start of a shell script. Parse as a block comment,
- terminated by !#, just like SCSH. */
- skip_scsh_block_comment (port);
- /* EOF is not an error here */
- c = scm_flush_ws (port, (char *)NULL);
- goto tryagain_no_flush_ws;
- #ifdef HAVE_ARRAYS
/* #*...: read the token beginning with `*' and pass the characters
   after the `*' to scm_istr2bve; a false result means the token is
   not valid and it is reported as an unknown # object.  */
- case '*':
- j = scm_read_token (c, tok_buf, port, 0);
- p = scm_istr2bve (SCM_CHARS (*tok_buf) + 1, (long) (j - 1));
- if (SCM_NFALSEP (p))
- return p;
- else
- goto unkshrp;
- #endif
/* #{ ... }#: read the token in "weird" mode (the opening brace is not
   stored) and intern it as a symbol.  */
- case '{':
- j = scm_read_token (c, tok_buf, port, 1);
- p = scm_intern (SCM_CHARS (*tok_buf), j);
- return SCM_CAR (p);
/* #\ character syntax.  A one-character token is that character
   itself.  Otherwise a token starting with an octal digit is tried as
   an octal character code, and finally the token is looked up,
   ignoring case, in scm_charnames.  Note that C is reused as the
   table index in the lookup loop.  */
- case '\\':
- c = scm_getc (port);
- j = scm_read_token (c, tok_buf, port, 0);
- if (j == 1)
- return SCM_MAKE_CHAR (c);
- if (c >= '0' && c < '8')
- {
- p = scm_istr2int (SCM_CHARS (*tok_buf), (long) j, 8);
- if (SCM_NFALSEP (p))
- return SCM_MAKE_CHAR (SCM_INUM (p));
- }
- for (c = 0; c < scm_n_charnames; c++)
- if (scm_charnames[c]
- && (scm_casei_streq (scm_charnames[c], SCM_CHARS (*tok_buf))))
- return SCM_MAKE_CHAR (scm_charnums[c]);
- scm_wta (SCM_UNDEFINED, "unknown # object: #\\", SCM_CHARS (*tok_buf));
- /* #:SYMBOL is a syntax for keywords supported in all contexts. */
/* The token is read with `-' supplied as its first character, so the
   interned symbol begins with a dash, as the keyword constructor's
   name indicates it expects.  */
- case ':':
- j = scm_read_token ('-', tok_buf, port, 0);
- p = scm_intern (SCM_CHARS (*tok_buf), j);
- return scm_make_keyword_from_dash_symbol (SCM_CAR (p));
/* Anything else: look for a procedure registered for this character
   (see read-hash-extend).  It is applied to the character and the
   port.  A result of SCM_UNSPECIFIED, or no usable procedure at all,
   is reported as an unknown # object.  */
- default:
- callshrp:
- {
- SCM sharp = scm_get_hash_procedure (c);
- if (SCM_NIMP (sharp))
- {
/* Sample the position before the procedure consumes more input.  */
- int line = SCM_LINUM (port);
- int column = SCM_COL (port) - 2;
- SCM got;
- got = scm_apply (sharp,
- SCM_MAKE_CHAR (c),
- scm_acons (port, SCM_EOL, SCM_EOL));
- if (SCM_EQ_P (got, SCM_UNSPECIFIED))
- goto unkshrp;
- if (SCM_RECORD_POSITIONS_P)
- return *copy = recsexpr (got, line, column,
- SCM_FILENAME (port));
- else
- return got;
- }
- }
- unkshrp:
- scm_misc_error (s_scm_read, "Unknown # object: ~S",
- scm_listify (SCM_MAKE_CHAR (c), SCM_UNDEFINED));
- }
/* String literal: accumulate characters in the token buffer up to the
   closing double quote.  */
- case '"':
- j = 0;
- while ('"' != (c = scm_getc (port)))
- {
- SCM_ASSERT (EOF != c, SCM_UNDEFINED, "end of file in ", "string");
/* Keep room for this character and the terminating NUL.  */
- while (j + 2 >= SCM_LENGTH (*tok_buf))
- scm_grow_tok_buf (tok_buf);
/* Backslash escapes.  Backslash-newline stores nothing (`continue'
   resumes the enclosing while loop).  A character with no case below
   is stored as itself.  */
- if (c == '\\')
- switch (c = scm_getc (port))
- {
- case '\n':
- continue;
- case '0':
- c = '\0';
- break;
- case 'f':
- c = '\f';
- break;
- case 'n':
- c = '\n';
- break;
- case 'r':
- c = '\r';
- break;
- case 't':
- c = '\t';
- break;
- case 'a':
- c = '\007';
- break;
- case 'v':
- c = '\v';
- break;
- }
- SCM_CHARS (*tok_buf)[j] = c;
- ++j;
- }
/* The empty string is returned as scm_nullstr.  */
- if (j == 0)
- return scm_nullstr;
- SCM_CHARS (*tok_buf)[j] = 0;
- {
- SCM str;
- str = scm_makfromstr (SCM_CHARS (*tok_buf), j, 0);
- return str;
- }
/* Tokens that may be numbers.  If the token does not parse as a
   number it is interned as a symbol at `tok', unless it was entered
   through a `#' numeric prefix.  */
- case'0':case '1':case '2':case '3':case '4':
- case '5':case '6':case '7':case '8':case '9':
- case '.':
- case '-':
- case '+':
- num:
- j = scm_read_token (c, tok_buf, port, 0);
- p = scm_istring2number (SCM_CHARS (*tok_buf), (long) j, 10L);
- if (SCM_NFALSEP (p))
- return p;
- if (c == '#')
- {
/* A two-character token such as "#e" directly followed by `(' is
   retried as a hash-procedure dispatch on the second character.  The
   character fetched for this test is only pushed back when it is
   `('.  */
- if ((j == 2) && (scm_getc (port) == '('))
- {
- scm_ungetc ('(', port);
- c = SCM_CHARS (*tok_buf)[1];
- goto callshrp;
- }
- scm_wta (SCM_UNDEFINED, "unknown # object", SCM_CHARS (*tok_buf));
- }
- goto tok;
/* Leading `:' reads a keyword only when the "keywords" option is the
   symbol `prefix'; otherwise it is an ordinary symbol character.  */
- case ':':
- if (SCM_EQ_P (SCM_PACK (SCM_KEYWORD_STYLE), scm_keyword_prefix))
- {
- j = scm_read_token ('-', tok_buf, port, 0);
- p = scm_intern (SCM_CHARS (*tok_buf), j);
- return scm_make_keyword_from_dash_symbol (SCM_CAR (p));
- }
- /* fallthrough */
/* Everything else is a symbol: read the token and intern it.  */
- default:
- j = scm_read_token (c, tok_buf, port, 0);
- /* fallthrough */
- tok:
- p = scm_intern (SCM_CHARS (*tok_buf), j);
- return SCM_CAR (p);
- }
- }
- #ifdef _UNICOS
- _Pragma ("noopt"); /* # pragma _CRI noopt */
- #endif
- scm_sizet
- scm_read_token (int ic, SCM *tok_buf, SCM port, int weird)
- {
- register scm_sizet j;
- register int c;
- register char *p;
- c = (SCM_CASE_INSENSITIVE_P ? scm_downcase(ic) : ic);
- p = SCM_CHARS (*tok_buf);
- if (weird)
- j = 0;
- else
- {
- j = 0;
- while (j + 2 >= SCM_LENGTH (*tok_buf))
- p = scm_grow_tok_buf (tok_buf);
- p[j] = c;
- ++j;
- }
- while (1)
- {
- while (j + 2 >= SCM_LENGTH (*tok_buf))
- p = scm_grow_tok_buf (tok_buf);
- c = scm_getc (port);
- switch (c)
- {
- case '(':
- case ')':
- case '"':
- case ';':
- case SCM_WHITE_SPACES:
- case SCM_LINE_INCREMENTORS:
- if (weird)
- goto default_case;
- scm_ungetc (c, port);
- case EOF:
- eof_case:
- p[j] = 0;
- return j;
- case '\\':
- if (!weird)
- goto default_case;
- else
- {
- c = scm_getc (port);
- if (c == EOF)
- goto eof_case;
- else
- goto default_case;
- }
- case '}':
- if (!weird)
- goto default_case;
- c = scm_getc (port);
- if (c == '#')
- {
- p[j] = 0;
- return j;
- }
- else
- {
- scm_ungetc (c, port);
- c = '}';
- goto default_case;
- }
- default:
- default_case:
- {
- c = (SCM_CASE_INSENSITIVE_P ? scm_downcase(c) : c);
- p[j] = c;
- ++j;
- }
- }
- }
- }
- #ifdef _UNICOS
- _Pragma ("opt"); /* # pragma _CRI opt */
- #endif
- SCM
- scm_lreadparen (SCM *tok_buf, SCM port, char *name, SCM *copy)
- {
- SCM tmp;
- SCM tl;
- SCM ans;
- int c;
- c = scm_flush_ws (port, name);
- if (')' == c)
- return SCM_EOL;
- scm_ungetc (c, port);
- if (SCM_EQ_P (scm_sym_dot, (tmp = scm_lreadr (tok_buf, port, copy))))
- {
- ans = scm_lreadr (tok_buf, port, copy);
- closeit:
- if (')' != (c = scm_flush_ws (port, name)))
- scm_wta (SCM_UNDEFINED, "missing close paren", "");
- return ans;
- }
- ans = tl = scm_cons (tmp, SCM_EOL);
- while (')' != (c = scm_flush_ws (port, name)))
- {
- scm_ungetc (c, port);
- if (SCM_EQ_P (scm_sym_dot, (tmp = scm_lreadr (tok_buf, port, copy))))
- {
- SCM_SETCDR (tl, scm_lreadr (tok_buf, port, copy));
- goto closeit;
- }
- SCM_SETCDR (tl, scm_cons (tmp, SCM_EOL));
- tl = SCM_CDR (tl);
- }
- return ans;
- }
- SCM
- scm_lreadrecparen (SCM *tok_buf, SCM port, char *name, SCM *copy)
- {
- register int c;
- register SCM tmp;
- register SCM tl, tl2 = SCM_EOL;
- SCM ans, ans2 = SCM_EOL;
- /* Need to capture line and column numbers here. */
- int line = SCM_LINUM (port);
- int column = SCM_COL (port) - 1;
- c = scm_flush_ws (port, name);
- if (')' == c)
- return SCM_EOL;
- scm_ungetc (c, port);
- if (SCM_EQ_P (scm_sym_dot, (tmp = scm_lreadr (tok_buf, port, copy))))
- {
- ans = scm_lreadr (tok_buf, port, copy);
- if (')' != (c = scm_flush_ws (port, name)))
- scm_wta (SCM_UNDEFINED, "missing close paren", "");
- return ans;
- }
- /* Build the head of the list structure. */
- ans = tl = scm_cons (tmp, SCM_EOL);
- if (SCM_COPY_SOURCE_P)
- ans2 = tl2 = scm_cons (SCM_CONSP (tmp)
- ? *copy
- : tmp,
- SCM_EOL);
- while (')' != (c = scm_flush_ws (port, name)))
- {
- scm_ungetc (c, port);
- if (SCM_EQ_P (scm_sym_dot, (tmp = scm_lreadr (tok_buf, port, copy))))
- {
- SCM_SETCDR (tl, tmp = scm_lreadr (tok_buf, port, copy));
- if (SCM_COPY_SOURCE_P)
- SCM_SETCDR (tl2, scm_cons (SCM_CONSP (tmp)
- ? *copy
- : tmp,
- SCM_EOL));
- if (')' != (c = scm_flush_ws (port, name)))
- scm_wta (SCM_UNDEFINED, "missing close paren", "");
- goto exit;
- }
- tl = SCM_SETCDR (tl, scm_cons (tmp, SCM_EOL));
- if (SCM_COPY_SOURCE_P)
- tl2 = SCM_SETCDR (tl2, scm_cons (SCM_CONSP (tmp)
- ? *copy
- : tmp,
- SCM_EOL));
- }
- exit:
- scm_whash_insert (scm_source_whash,
- ans,
- scm_make_srcprops (line,
- column,
- SCM_FILENAME (port),
- SCM_COPY_SOURCE_P
- ? *copy = ans2
- : SCM_UNDEFINED,
- SCM_EOL));
- return ans;
- }
- /* Manipulate the read-hash-procedures alist. This could be written in
- Scheme, but maybe it will also be used by C code during initialisation. */
- SCM_DEFINE (scm_read_hash_extend, "read-hash-extend", 2, 0, 0,
- (SCM chr, SCM proc),
- "")
- #define FUNC_NAME s_scm_read_hash_extend
- {
- SCM this;
- SCM prev;
- SCM_VALIDATE_CHAR (1,chr);
- SCM_ASSERT (SCM_FALSEP (proc) || SCM_NIMP(proc), proc, SCM_ARG2,
- FUNC_NAME);
- /* Check if chr is already in the alist. */
- this = *scm_read_hash_procedures;
- prev = SCM_BOOL_F;
- while (1)
- {
- if (SCM_NULLP (this))
- {
- /* not found, so add it to the beginning. */
- if (SCM_NFALSEP (proc))
- {
- *scm_read_hash_procedures =
- scm_cons (scm_cons (chr, proc), *scm_read_hash_procedures);
- }
- break;
- }
- if (SCM_EQ_P (chr, SCM_CAAR (this)))
- {
- /* already in the alist. */
- if (SCM_FALSEP (proc))
- {
- /* remove it. */
- if (SCM_FALSEP (prev))
- {
- *scm_read_hash_procedures =
- SCM_CDR (*scm_read_hash_procedures);
- }
- else
- scm_set_cdr_x (prev, SCM_CDR (this));
- }
- else
- {
- /* replace it. */
- scm_set_cdr_x (SCM_CAR (this), proc);
- }
- break;
- }
- prev = this;
- this = SCM_CDR (this);
- }
- return SCM_UNSPECIFIED;
- }
- #undef FUNC_NAME
- /* Recover the read-hash procedure corresponding to char c. */
- static SCM
- scm_get_hash_procedure (int c)
- {
- SCM rest = *scm_read_hash_procedures;
- while (1)
- {
- if (SCM_NULLP (rest))
- return SCM_BOOL_F;
-
- if (SCM_CHAR (SCM_CAAR (rest)) == c)
- return SCM_CDAR (rest);
-
- rest = SCM_CDR (rest);
- }
- }
- void
- scm_init_read ()
- {
- scm_read_hash_procedures =
- SCM_CDRLOC (scm_sysintern ("read-hash-procedures", SCM_EOL));
- scm_init_opts (scm_read_options, scm_read_opts, SCM_N_READ_OPTIONS);
- #include "libguile/read.x"
- }
- /*
- Local Variables:
- c-file-style: "gnu"
- End:
- */
|