symbols.c 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457
  1. /* Copyright (C) 1995,1996,1997,1998,2000,2001, 2003, 2004, 2006, 2009 Free Software Foundation, Inc.
  2. *
  3. * This library is free software; you can redistribute it and/or
  4. * modify it under the terms of the GNU Lesser General Public License
  5. * as published by the Free Software Foundation; either version 3 of
  6. * the License, or (at your option) any later version.
  7. *
  8. * This library is distributed in the hope that it will be useful, but
  9. * WITHOUT ANY WARRANTY; without even the implied warranty of
  10. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  11. * Lesser General Public License for more details.
  12. *
  13. * You should have received a copy of the GNU Lesser General Public
  14. * License along with this library; if not, write to the Free Software
  15. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
  16. * 02110-1301 USA
  17. */
  18. #ifdef HAVE_CONFIG_H
  19. # include <config.h>
  20. #endif
  21. #include "libguile/_scm.h"
  22. #include "libguile/chars.h"
  23. #include "libguile/eval.h"
  24. #include "libguile/hash.h"
  25. #include "libguile/smob.h"
  26. #include "libguile/variable.h"
  27. #include "libguile/alist.h"
  28. #include "libguile/fluids.h"
  29. #include "libguile/strings.h"
  30. #include "libguile/vectors.h"
  31. #include "libguile/hashtab.h"
  32. #include "libguile/weaks.h"
  33. #include "libguile/modules.h"
  34. #include "libguile/read.h"
  35. #include "libguile/srfi-13.h"
  36. #include "libguile/validate.h"
  37. #include "libguile/symbols.h"
  38. #include "libguile/private-options.h"
  39. #ifdef HAVE_STRING_H
  40. #include <string.h>
  41. #endif
  42. static SCM symbols;
  43. #ifdef GUILE_DEBUG
  44. SCM_DEFINE (scm_sys_symbols, "%symbols", 0, 0, 0,
  45. (),
  46. "Return the system symbol obarray.")
  47. #define FUNC_NAME s_scm_sys_symbols
  48. {
  49. return symbols;
  50. }
  51. #undef FUNC_NAME
  52. #endif
  53. /* {Symbols}
  54. */
  55. /* In order to optimize reading speed, this function breaks part of
  56. * the hashtable abstraction. The optimizations are:
  57. *
  58. * 1. The argument string can be compared directly to symbol objects
  59. * without first creating an SCM string object. (This would have
  60. * been necessary if we had used the hashtable API in hashtab.h.)
  61. *
  62. * 2. We can use the raw hash value stored in scm_i_symbol_hash (sym)
  63. * to speed up lookup.
  64. *
  65. * Both optimizations might be possible without breaking the
  66. * abstraction if the API in hashtab.c is improved.
  67. */
  68. unsigned long
  69. scm_i_hash_symbol (SCM obj, unsigned long n, void *closure)
  70. {
  71. return scm_i_symbol_hash (obj) % n;
  72. }
  73. static SCM
  74. lookup_interned_symbol (const char *name, size_t len,
  75. unsigned long raw_hash)
  76. {
  77. /* Try to find the symbol in the symbols table */
  78. SCM l;
  79. unsigned long hash = raw_hash % SCM_HASHTABLE_N_BUCKETS (symbols);
  80. for (l = SCM_HASHTABLE_BUCKET (symbols, hash);
  81. !scm_is_null (l);
  82. l = SCM_CDR (l))
  83. {
  84. SCM sym = SCM_CAAR (l);
  85. if (scm_i_symbol_hash (sym) == raw_hash
  86. && scm_i_symbol_length (sym) == len)
  87. {
  88. const char *chrs = scm_i_symbol_chars (sym);
  89. size_t i = len;
  90. while (i != 0)
  91. {
  92. --i;
  93. if (name[i] != chrs[i])
  94. goto next_symbol;
  95. }
  96. return sym;
  97. }
  98. next_symbol:
  99. ;
  100. }
  101. return SCM_BOOL_F;
  102. }
  103. /* Intern SYMBOL, an uninterned symbol. */
  104. static void
  105. intern_symbol (SCM symbol)
  106. {
  107. SCM slot, cell;
  108. unsigned long hash;
  109. hash = scm_i_symbol_hash (symbol) % SCM_HASHTABLE_N_BUCKETS (symbols);
  110. slot = SCM_HASHTABLE_BUCKET (symbols, hash);
  111. cell = scm_cons (symbol, SCM_UNDEFINED);
  112. SCM_SET_HASHTABLE_BUCKET (symbols, hash, scm_cons (cell, slot));
  113. SCM_HASHTABLE_INCREMENT (symbols);
  114. if (SCM_HASHTABLE_N_ITEMS (symbols) > SCM_HASHTABLE_UPPER (symbols))
  115. scm_i_rehash (symbols, scm_i_hash_symbol, 0, "intern_symbol");
  116. }
  117. static SCM
  118. scm_i_c_mem2symbol (const char *name, size_t len)
  119. {
  120. SCM symbol;
  121. size_t raw_hash = scm_string_hash ((const unsigned char *) name, len);
  122. symbol = lookup_interned_symbol (name, len, raw_hash);
  123. if (scm_is_false (symbol))
  124. {
  125. /* The symbol was not found, create it. */
  126. symbol = scm_i_c_make_symbol (name, len, 0, raw_hash,
  127. scm_cons (SCM_BOOL_F, SCM_EOL));
  128. intern_symbol (symbol);
  129. }
  130. return symbol;
  131. }
  132. static SCM
  133. scm_i_mem2symbol (SCM str)
  134. {
  135. SCM symbol;
  136. const char *name = scm_i_string_chars (str);
  137. size_t len = scm_i_string_length (str);
  138. size_t raw_hash = scm_string_hash ((const unsigned char *) name, len);
  139. symbol = lookup_interned_symbol (name, len, raw_hash);
  140. if (scm_is_false (symbol))
  141. {
  142. /* The symbol was not found, create it. */
  143. symbol = scm_i_make_symbol (str, 0, raw_hash,
  144. scm_cons (SCM_BOOL_F, SCM_EOL));
  145. intern_symbol (symbol);
  146. }
  147. return symbol;
  148. }
  149. static SCM
  150. scm_i_mem2uninterned_symbol (SCM str)
  151. {
  152. const char *name = scm_i_string_chars (str);
  153. size_t len = scm_i_string_length (str);
  154. size_t raw_hash = scm_string_hash ((const unsigned char *) name, len);
  155. return scm_i_make_symbol (str, SCM_I_F_SYMBOL_UNINTERNED,
  156. raw_hash, scm_cons (SCM_BOOL_F, SCM_EOL));
  157. }
  158. SCM_DEFINE (scm_symbol_p, "symbol?", 1, 0, 0,
  159. (SCM obj),
  160. "Return @code{#t} if @var{obj} is a symbol, otherwise return\n"
  161. "@code{#f}.")
  162. #define FUNC_NAME s_scm_symbol_p
  163. {
  164. return scm_from_bool (scm_is_symbol (obj));
  165. }
  166. #undef FUNC_NAME
  167. SCM_DEFINE (scm_symbol_interned_p, "symbol-interned?", 1, 0, 0,
  168. (SCM symbol),
  169. "Return @code{#t} if @var{symbol} is interned, otherwise return\n"
  170. "@code{#f}.")
  171. #define FUNC_NAME s_scm_symbol_interned_p
  172. {
  173. SCM_VALIDATE_SYMBOL (1, symbol);
  174. return scm_from_bool (scm_i_symbol_is_interned (symbol));
  175. }
  176. #undef FUNC_NAME
  177. SCM_DEFINE (scm_make_symbol, "make-symbol", 1, 0, 0,
  178. (SCM name),
  179. "Return a new uninterned symbol with the name @var{name}. "
  180. "The returned symbol is guaranteed to be unique and future "
  181. "calls to @code{string->symbol} will not return it.")
  182. #define FUNC_NAME s_scm_make_symbol
  183. {
  184. SCM_VALIDATE_STRING (1, name);
  185. return scm_i_mem2uninterned_symbol (name);
  186. }
  187. #undef FUNC_NAME
  188. SCM_DEFINE (scm_symbol_to_string, "symbol->string", 1, 0, 0,
  189. (SCM s),
  190. "Return the name of @var{symbol} as a string. If the symbol was\n"
  191. "part of an object returned as the value of a literal expression\n"
  192. "(section @pxref{Literal expressions,,,r5rs, The Revised^5\n"
  193. "Report on Scheme}) or by a call to the @code{read} procedure,\n"
  194. "and its name contains alphabetic characters, then the string\n"
  195. "returned will contain characters in the implementation's\n"
  196. "preferred standard case---some implementations will prefer\n"
  197. "upper case, others lower case. If the symbol was returned by\n"
  198. "@code{string->symbol}, the case of characters in the string\n"
  199. "returned will be the same as the case in the string that was\n"
  200. "passed to @code{string->symbol}. It is an error to apply\n"
  201. "mutation procedures like @code{string-set!} to strings returned\n"
  202. "by this procedure.\n"
  203. "\n"
  204. "The following examples assume that the implementation's\n"
  205. "standard case is lower case:\n"
  206. "\n"
  207. "@lisp\n"
  208. "(symbol->string 'flying-fish) @result{} \"flying-fish\"\n"
  209. "(symbol->string 'Martin) @result{} \"martin\"\n"
  210. "(symbol->string\n"
  211. " (string->symbol \"Malvina\")) @result{} \"Malvina\"\n"
  212. "@end lisp")
  213. #define FUNC_NAME s_scm_symbol_to_string
  214. {
  215. SCM_VALIDATE_SYMBOL (1, s);
  216. return scm_i_symbol_substring (s, 0, scm_i_symbol_length (s));
  217. }
  218. #undef FUNC_NAME
  219. SCM_DEFINE (scm_string_to_symbol, "string->symbol", 1, 0, 0,
  220. (SCM string),
  221. "Return the symbol whose name is @var{string}. This procedure\n"
  222. "can create symbols with names containing special characters or\n"
  223. "letters in the non-standard case, but it is usually a bad idea\n"
  224. "to create such symbols because in some implementations of\n"
  225. "Scheme they cannot be read as themselves. See\n"
  226. "@code{symbol->string}.\n"
  227. "\n"
  228. "The following examples assume that the implementation's\n"
  229. "standard case is lower case:\n"
  230. "\n"
  231. "@lisp\n"
  232. "(eq? 'mISSISSIppi 'mississippi) @result{} #t\n"
  233. "(string->symbol \"mISSISSIppi\") @result{} @r{the symbol with name \"mISSISSIppi\"}\n"
  234. "(eq? 'bitBlt (string->symbol \"bitBlt\")) @result{} #f\n"
  235. "(eq? 'JollyWog\n"
  236. " (string->symbol (symbol->string 'JollyWog))) @result{} #t\n"
  237. "(string=? \"K. Harper, M.D.\"\n"
  238. " (symbol->string\n"
  239. " (string->symbol \"K. Harper, M.D.\"))) @result{}#t\n"
  240. "@end lisp")
  241. #define FUNC_NAME s_scm_string_to_symbol
  242. {
  243. SCM_VALIDATE_STRING (1, string);
  244. return scm_i_mem2symbol (string);
  245. }
  246. #undef FUNC_NAME
  247. SCM_DEFINE (scm_string_ci_to_symbol, "string-ci->symbol", 1, 0, 0,
  248. (SCM str),
  249. "Return the symbol whose name is @var{str}. @var{str} is\n"
  250. "converted to lowercase before the conversion is done, if Guile\n"
  251. "is currently reading symbols case-insensitively.")
  252. #define FUNC_NAME s_scm_string_ci_to_symbol
  253. {
  254. return scm_string_to_symbol (SCM_CASE_INSENSITIVE_P
  255. ? scm_string_downcase(str)
  256. : str);
  257. }
  258. #undef FUNC_NAME
  259. #define MAX_PREFIX_LENGTH 30
  260. SCM_DEFINE (scm_gensym, "gensym", 0, 1, 0,
  261. (SCM prefix),
  262. "Create a new symbol with a name constructed from a prefix and\n"
  263. "a counter value. The string @var{prefix} can be specified as\n"
  264. "an optional argument. Default prefix is @code{ g}. The counter\n"
  265. "is increased by 1 at each call. There is no provision for\n"
  266. "resetting the counter.")
  267. #define FUNC_NAME s_scm_gensym
  268. {
  269. static int gensym_counter = 0;
  270. SCM suffix, name;
  271. int n, n_digits;
  272. char buf[SCM_INTBUFLEN];
  273. if (SCM_UNBNDP (prefix))
  274. prefix = scm_from_locale_string (" g");
  275. /* mutex in case another thread looks and incs at the exact same moment */
  276. scm_i_scm_pthread_mutex_lock (&scm_i_misc_mutex);
  277. n = gensym_counter++;
  278. scm_i_pthread_mutex_unlock (&scm_i_misc_mutex);
  279. n_digits = scm_iint2str (n, 10, buf);
  280. suffix = scm_from_locale_stringn (buf, n_digits);
  281. name = scm_string_append (scm_list_2 (prefix, suffix));
  282. return scm_string_to_symbol (name);
  283. }
  284. #undef FUNC_NAME
  285. SCM_DEFINE (scm_symbol_hash, "symbol-hash", 1, 0, 0,
  286. (SCM symbol),
  287. "Return a hash value for @var{symbol}.")
  288. #define FUNC_NAME s_scm_symbol_hash
  289. {
  290. SCM_VALIDATE_SYMBOL (1, symbol);
  291. return scm_from_ulong (scm_i_symbol_hash (symbol));
  292. }
  293. #undef FUNC_NAME
  294. SCM_DEFINE (scm_symbol_fref, "symbol-fref", 1, 0, 0,
  295. (SCM s),
  296. "Return the contents of @var{symbol}'s @dfn{function slot}.")
  297. #define FUNC_NAME s_scm_symbol_fref
  298. {
  299. SCM_VALIDATE_SYMBOL (1, s);
  300. return SCM_CAR (SCM_CELL_OBJECT_3 (s));
  301. }
  302. #undef FUNC_NAME
  303. SCM_DEFINE (scm_symbol_pref, "symbol-pref", 1, 0, 0,
  304. (SCM s),
  305. "Return the @dfn{property list} currently associated with @var{symbol}.")
  306. #define FUNC_NAME s_scm_symbol_pref
  307. {
  308. SCM_VALIDATE_SYMBOL (1, s);
  309. return SCM_CDR (SCM_CELL_OBJECT_3 (s));
  310. }
  311. #undef FUNC_NAME
  312. SCM_DEFINE (scm_symbol_fset_x, "symbol-fset!", 2, 0, 0,
  313. (SCM s, SCM val),
  314. "Change the binding of @var{symbol}'s function slot.")
  315. #define FUNC_NAME s_scm_symbol_fset_x
  316. {
  317. SCM_VALIDATE_SYMBOL (1, s);
  318. SCM_SETCAR (SCM_CELL_OBJECT_3 (s), val);
  319. return SCM_UNSPECIFIED;
  320. }
  321. #undef FUNC_NAME
  322. SCM_DEFINE (scm_symbol_pset_x, "symbol-pset!", 2, 0, 0,
  323. (SCM s, SCM val),
  324. "Change the binding of @var{symbol}'s property slot.")
  325. #define FUNC_NAME s_scm_symbol_pset_x
  326. {
  327. SCM_VALIDATE_SYMBOL (1, s);
  328. SCM_SETCDR (SCM_CELL_OBJECT_3 (s), val);
  329. return SCM_UNSPECIFIED;
  330. }
  331. #undef FUNC_NAME
  332. SCM
  333. scm_from_locale_symbol (const char *sym)
  334. {
  335. return scm_i_c_mem2symbol (sym, strlen (sym));
  336. }
  337. SCM
  338. scm_from_locale_symboln (const char *sym, size_t len)
  339. {
  340. return scm_i_c_mem2symbol (sym, len);
  341. }
  342. SCM
  343. scm_take_locale_symboln (char *sym, size_t len)
  344. {
  345. SCM res;
  346. unsigned long raw_hash;
  347. if (len == (size_t)-1)
  348. len = strlen (sym);
  349. else
  350. {
  351. /* Ensure STR is null terminated. A realloc for 1 extra byte should
  352. often be satisfied from the alignment padding after the block, with
  353. no actual data movement. */
  354. sym = scm_realloc (sym, len+1);
  355. sym[len] = '\0';
  356. }
  357. raw_hash = scm_string_hash ((unsigned char *)sym, len);
  358. res = lookup_interned_symbol (sym, len, raw_hash);
  359. if (scm_is_false (res))
  360. {
  361. res = scm_i_c_take_symbol (sym, len, 0, raw_hash,
  362. scm_cons (SCM_BOOL_F, SCM_EOL));
  363. intern_symbol (res);
  364. }
  365. else
  366. free (sym);
  367. return res;
  368. }
  369. SCM
  370. scm_take_locale_symbol (char *sym)
  371. {
  372. return scm_take_locale_symboln (sym, (size_t)-1);
  373. }
  374. void
  375. scm_symbols_prehistory ()
  376. {
  377. symbols = scm_make_weak_key_hash_table (scm_from_int (2139));
  378. scm_permanent_object (symbols);
  379. }
  /* Module initialisation for this file.  The body consists solely of the contents of "libguile/symbols.x"; presumably that file is generated from the SCM_DEFINE forms above (TODO confirm against the build).  */
  380. void
  381. scm_init_symbols ()
  382. {
  383. #include "libguile/symbols.x"
  384. }
  385. /*
  386. Local Variables:
  387. c-file-style: "gnu"
  388. End:
  389. */