12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227
72278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356235723582359236023612362236323642365236623672368236923702371237223732374237523762377237823792380238123822383238423852386238723882389239023912392239323942395239623972398239924002401240224032404240524062407240824092410241124122413241424152416241724182419242024212422242324242425242624272428242924302431243224332434243524362437243824392440244124422443244424452446244724482449245024512452245324542455245624572458245924602461246224632464246524662467246824692470247124722473247424752476247724782479248024812482248324842485248624872488248924902491249224932494249524962497249824992500250125022503250425052506250725082509251025112512251325142515251625172518251925202521252225232524252525262527252825292530253125322533253425352536253725382539254025412542254325442545254625472548254925502551255225532554255525562557255825592560256125622563256425652566256725682569257025712572257325742575257625772578257925802581258225832584258525862587258825892590259125922593259425952596259725982599260026012602260326042605260626072608260926102611261226132614261526162617261826192620262126222623262426252626262726282629263026312632263326342635263626372638263926402641264226432644264526462647264826492650265126522653265426552656265726582659266026612662266326642665266626672668266926702671267226732674267526762677267826792680268126822683268426852686268726882689269026912692269326942695269626972698269927002701270227032704270527062707270827092710271127122713271427152716271727182719272027212722272327242725272627272728272927302731273227332734273527362737273827392740274127422743274427452746274727482749275027512752275327542755275627572758275927602761276227632764276527662767276827692770277127722773277427752776277
7277827792780278127822783278427852786278727882789279027912792279327942795279627972798279928002801280228032804280528062807280828092810281128122813281428152816281728182819282028212822282328242825282628272828282928302831283228332834283528362837283828392840284128422843284428452846284728482849285028512852285328542855285628572858285928602861286228632864286528662867286828692870287128722873287428752876287728782879288028812882288328842885288628872888288928902891289228932894289528962897289828992900290129022903290429052906290729082909291029112912291329142915291629172918291929202921292229232924292529262927292829292930293129322933293429352936293729382939294029412942294329442945294629472948294929502951295229532954295529562957295829592960296129622963296429652966296729682969297029712972297329742975297629772978297929802981298229832984298529862987298829892990299129922993299429952996299729982999300030013002300330043005300630073008300930103011301230133014301530163017301830193020302130223023302430253026302730283029303030313032303330343035303630373038303930403041304230433044304530463047304830493050305130523053305430553056305730583059306030613062306330643065306630673068306930703071307230733074307530763077307830793080308130823083308430853086308730883089309030913092309330943095309630973098309931003101310231033104310531063107310831093110311131123113311431153116311731183119312031213122312331243125312631273128312931303131313231333134313531363137313831393140314131423143314431453146314731483149315031513152315331543155315631573158315931603161316231633164316531663167316831693170317131723173317431753176317731783179318031813182318331843185318631873188318931903191319231933194319531963197319831993200320132023203320432053206320732083209321032113212321332143215321632173218321932203221 |
- /* Copyright (C) 1995, 1996, 1997, 1998, 1999, 2000, 2001, 2003, 2004, 2006,
- * 2007, 2008, 2009, 2010, 2011, 2012, 2013,
- * 2014, 2015 Free Software Foundation, Inc.
- *
- * This library is free software; you can redistribute it and/or
- * modify it under the terms of the GNU Lesser General Public License
- * as published by the Free Software Foundation; either version 3 of
- * the License, or (at your option) any later version.
- *
- * This library is distributed in the hope that it will be useful, but
- * WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
- * Lesser General Public License for more details.
- *
- * You should have received a copy of the GNU Lesser General Public
- * License along with this library; if not, write to the Free Software
- * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
- * 02110-1301 USA
- */
- /* Headers. */
- #define _LARGEFILE64_SOURCE /* ask for stat64 etc */
- #ifdef HAVE_CONFIG_H
- # include <config.h>
- #endif
- #include <stdio.h>
- #include <errno.h>
- #include <fcntl.h> /* for chsize on mingw */
- #include <assert.h>
- #include <iconv.h>
- #include <uniconv.h>
- #include <unistr.h>
- #include <striconveh.h>
- #include <assert.h>
- #include "libguile/_scm.h"
- #include "libguile/async.h"
- #include "libguile/deprecation.h"
- #include "libguile/eval.h"
- #include "libguile/fports.h" /* direct access for seek and truncate */
- #include "libguile/goops.h"
- #include "libguile/smob.h"
- #include "libguile/chars.h"
- #include "libguile/dynwind.h"
- #include "libguile/keywords.h"
- #include "libguile/hashtab.h"
- #include "libguile/root.h"
- #include "libguile/strings.h"
- #include "libguile/mallocs.h"
- #include "libguile/validate.h"
- #include "libguile/ports.h"
- #include "libguile/ports-internal.h"
- #include "libguile/vectors.h"
- #include "libguile/weak-set.h"
- #include "libguile/fluids.h"
- #include "libguile/eq.h"
- #include "libguile/alist.h"
- #ifdef HAVE_STRING_H
- #include <string.h>
- #endif
- #ifdef HAVE_IO_H
- #include <io.h>
- #endif
- #include <unistd.h>
- #ifdef HAVE_SYS_IOCTL_H
- #include <sys/ioctl.h>
- #endif
/* Fallback for systems that provide chsize but not ftruncate.

   Mingw (version 3.4.5, circa 2006) already has ftruncate as an alias
   for chsize, but this is kept in case past versions did not, or to
   help other minimal DOS environments.

   gnulib ftruncate.c has code using fcntl F_CHSIZE and F_FREESP, which
   might be possibilities if we've got other systems without
   ftruncate.  */
#if !defined (HAVE_FTRUNCATE) && defined (HAVE_CHSIZE)
# define ftruncate(fd, size) chsize (fd, size)
# undef HAVE_FTRUNCATE
# define HAVE_FTRUNCATE 1
#endif
/* Port encodings are case-insensitive ASCII strings.

   Return the upper-case counterpart of C when C is one of the ASCII
   letters 'a'..'z'; return every other character unchanged.  */
static char
ascii_toupper (char c)
{
  if (c >= 'a' && c <= 'z')
    return 'A' + (c - 'a');

  return c;
}
/* Return non-zero if ENC, upper-cased with ascii_toupper, is equal to
   UPPER; return zero otherwise.  A NULL ENC is treated as
   "ISO-8859-1".

   It is only necessary to use this function on encodings that come
   from the user and have not been canonicalized yet.  Encodings that
   are set on ports or in the default encoding fluid are in upper-case,
   and can be compared with strcmp.  */
static int
encoding_matches (const char *enc, const char *upper)
{
  const char *p = enc ? enc : "ISO-8859-1";

  for (; *p != '\0'; p++, upper++)
    {
      if (ascii_toupper (*p) != *upper)
        return 0;
    }

  /* ENC is exhausted; it matches only if UPPER is exhausted too.  */
  return *upper == '\0';
}
- static char*
- canonicalize_encoding (const char *enc)
- {
- char *ret;
- int i;
- if (!enc)
- return "ISO-8859-1";
- ret = scm_gc_strdup (enc, "port");
- for (i = 0; ret[i]; i++)
- {
- if (ret[i] > 127)
- /* Restrict to ASCII. */
- scm_misc_error (NULL, "invalid character encoding ~s",
- scm_list_1 (scm_from_latin1_string (enc)));
- else
- ret[i] = ascii_toupper (ret[i]);
- }
- return ret;
- }
- /* The port kind table --- a dynamically resized array of port types. */
- /* scm_ptobs scm_numptob
- * implement a dynamically resized array of ptob records.
- * Indexes into this table are used when generating type
- * tags for smobjects (if you know a tag you can get an index and conversely).
- */
- static scm_t_ptob_descriptor **scm_ptobs = NULL;
- static long scm_numptob = 0; /* Number of port types. */
- static long scm_ptobs_size = 0; /* Number of slots in the port type
- table. */
- static scm_i_pthread_mutex_t scm_ptobs_lock = SCM_I_PTHREAD_MUTEX_INITIALIZER;
- long
- scm_c_num_port_types (void)
- {
- long ret;
-
- scm_i_pthread_mutex_lock (&scm_ptobs_lock);
- ret = scm_numptob;
- scm_i_pthread_mutex_unlock (&scm_ptobs_lock);
- return ret;
- }
- scm_t_ptob_descriptor*
- scm_c_port_type_ref (long ptobnum)
- {
- scm_t_ptob_descriptor *ret = NULL;
- scm_i_pthread_mutex_lock (&scm_ptobs_lock);
- if (0 <= ptobnum && ptobnum < scm_numptob)
- ret = scm_ptobs[ptobnum];
- scm_i_pthread_mutex_unlock (&scm_ptobs_lock);
- if (!ret)
- scm_out_of_range ("scm_c_port_type_ref", scm_from_long (ptobnum));
- return ret;
- }
- long
- scm_c_port_type_add_x (scm_t_ptob_descriptor *desc)
- {
- long ret = -1;
- scm_i_pthread_mutex_lock (&scm_ptobs_lock);
-
- if (scm_numptob + 1 < SCM_I_MAX_PORT_TYPE_COUNT)
- {
- if (scm_numptob == scm_ptobs_size)
- {
- unsigned long old_size = scm_ptobs_size;
- scm_t_ptob_descriptor **old_ptobs = scm_ptobs;
-
- /* Currently there are only 9 predefined port types, so one
- resize will cover it. */
- scm_ptobs_size = old_size + 10;
- if (scm_ptobs_size >= SCM_I_MAX_PORT_TYPE_COUNT)
- scm_ptobs_size = SCM_I_MAX_PORT_TYPE_COUNT;
- scm_ptobs = scm_gc_malloc (sizeof (*scm_ptobs) * scm_ptobs_size,
- "scm_ptobs");
- memcpy (scm_ptobs, old_ptobs, sizeof (*scm_ptobs) * scm_numptob);
- }
- ret = scm_numptob++;
- scm_ptobs[ret] = desc;
- }
-
- scm_i_pthread_mutex_unlock (&scm_ptobs_lock);
- if (ret < 0)
- scm_out_of_range ("scm_c_port_type_add_x", scm_from_long (scm_numptob));
- return ret;
- }
- /*
- * We choose to use an interface similar to the smob interface with
- * fill_input and write as standard fields, passed to the port
- * type constructor, and optional fields set by setters.
- */
- static void
- flush_port_default (SCM port SCM_UNUSED)
- {
- }
- static void
- end_input_default (SCM port SCM_UNUSED, int offset SCM_UNUSED)
- {
- }
- scm_t_bits
- scm_make_port_type (char *name,
- int (*fill_input) (SCM port),
- void (*write) (SCM port, const void *data, size_t size))
- {
- scm_t_ptob_descriptor *desc;
- long ptobnum;
- desc = scm_gc_malloc_pointerless (sizeof (*desc), "port-type");
- memset (desc, 0, sizeof (*desc));
- desc->name = name;
- desc->print = scm_port_print;
- desc->write = write;
- desc->flush = flush_port_default;
- desc->end_input = end_input_default;
- desc->fill_input = fill_input;
- ptobnum = scm_c_port_type_add_x (desc);
- /* Make a class object if GOOPS is present. */
- if (SCM_UNPACK (scm_i_port_class[0]) != 0)
- scm_make_port_classes (ptobnum, name);
- return scm_tc7_port + ptobnum * 256;
- }
- void
- scm_set_port_mark (scm_t_bits tc, SCM (*mark) (SCM))
- {
- scm_c_port_type_ref (SCM_TC2PTOBNUM (tc))->mark = mark;
- }
- void
- scm_set_port_free (scm_t_bits tc, size_t (*free) (SCM))
- {
- scm_c_port_type_ref (SCM_TC2PTOBNUM (tc))->free = free;
- }
- void
- scm_set_port_print (scm_t_bits tc, int (*print) (SCM exp, SCM port,
- scm_print_state *pstate))
- {
- scm_c_port_type_ref (SCM_TC2PTOBNUM (tc))->print = print;
- }
- void
- scm_set_port_equalp (scm_t_bits tc, SCM (*equalp) (SCM, SCM))
- {
- scm_c_port_type_ref (SCM_TC2PTOBNUM (tc))->equalp = equalp;
- }
- void
- scm_set_port_close (scm_t_bits tc, int (*close) (SCM))
- {
- scm_c_port_type_ref (SCM_TC2PTOBNUM (tc))->close = close;
- }
- void
- scm_set_port_flush (scm_t_bits tc, void (*flush) (SCM port))
- {
- scm_t_ptob_descriptor *ptob = scm_c_port_type_ref (SCM_TC2PTOBNUM (tc));
- ptob->flush = flush;
- ptob->flags |= SCM_PORT_TYPE_HAS_FLUSH;
- }
- void
- scm_set_port_end_input (scm_t_bits tc, void (*end_input) (SCM port, int offset))
- {
- scm_c_port_type_ref (SCM_TC2PTOBNUM (tc))->end_input = end_input;
- }
- void
- scm_set_port_seek (scm_t_bits tc, scm_t_off (*seek) (SCM, scm_t_off, int))
- {
- scm_c_port_type_ref (SCM_TC2PTOBNUM (tc))->seek = seek;
- }
- void
- scm_set_port_truncate (scm_t_bits tc, void (*truncate) (SCM, scm_t_off))
- {
- scm_c_port_type_ref (SCM_TC2PTOBNUM (tc))->truncate = truncate;
- }
- void
- scm_set_port_input_waiting (scm_t_bits tc, int (*input_waiting) (SCM))
- {
- scm_c_port_type_ref (SCM_TC2PTOBNUM (tc))->input_waiting = input_waiting;
- }
- void
- scm_set_port_setvbuf (scm_t_bits tc, void (*setvbuf) (SCM, long, long))
- {
- scm_c_port_type_ref (SCM_TC2PTOBNUM (tc))->setvbuf = setvbuf;
- }
- static void
- scm_i_set_pending_eof (SCM port)
- {
- SCM_PORT_GET_INTERNAL (port)->pending_eof = 1;
- }
- static void
- scm_i_clear_pending_eof (SCM port)
- {
- SCM_PORT_GET_INTERNAL (port)->pending_eof = 0;
- }
- SCM_DEFINE (scm_i_port_property, "%port-property", 2, 0, 0,
- (SCM port, SCM key),
- "Return the property of @var{port} associated with @var{key}.")
- #define FUNC_NAME s_scm_i_port_property
- {
- scm_i_pthread_mutex_t *lock;
- SCM result;
- SCM_VALIDATE_OPPORT (1, port);
- scm_c_lock_port (port, &lock);
- result = scm_assq_ref (SCM_PORT_GET_INTERNAL (port)->alist, key);
- if (lock)
- scm_i_pthread_mutex_unlock (lock);
- return result;
- }
- #undef FUNC_NAME
- SCM_DEFINE (scm_i_set_port_property_x, "%set-port-property!", 3, 0, 0,
- (SCM port, SCM key, SCM value),
- "Set the property of @var{port} associated with @var{key} to @var{value}.")
- #define FUNC_NAME s_scm_i_set_port_property_x
- {
- scm_i_pthread_mutex_t *lock;
- scm_t_port_internal *pti;
- SCM_VALIDATE_OPPORT (1, port);
- scm_c_lock_port (port, &lock);
- pti = SCM_PORT_GET_INTERNAL (port);
- pti->alist = scm_assq_set_x (pti->alist, key, value);
- if (lock)
- scm_i_pthread_mutex_unlock (lock);
- return SCM_UNSPECIFIED;
- }
- #undef FUNC_NAME
- /* Standard ports --- current input, output, error, and more(!). */
- static SCM cur_inport_fluid = SCM_BOOL_F;
- static SCM cur_outport_fluid = SCM_BOOL_F;
- static SCM cur_errport_fluid = SCM_BOOL_F;
- static SCM cur_warnport_fluid = SCM_BOOL_F;
- static SCM cur_loadport_fluid = SCM_BOOL_F;
- SCM_DEFINE (scm_current_input_port, "current-input-port", 0, 0, 0,
- (void),
- "Return the current input port. This is the default port used\n"
- "by many input procedures. Initially, @code{current-input-port}\n"
- "returns the @dfn{standard input} in Unix and C terminology.")
- #define FUNC_NAME s_scm_current_input_port
- {
- if (scm_is_true (cur_inport_fluid))
- return scm_fluid_ref (cur_inport_fluid);
- else
- return SCM_BOOL_F;
- }
- #undef FUNC_NAME
- SCM_DEFINE (scm_current_output_port, "current-output-port", 0, 0, 0,
- (void),
- "Return the current output port. This is the default port used\n"
- "by many output procedures. Initially,\n"
- "@code{current-output-port} returns the @dfn{standard output} in\n"
- "Unix and C terminology.")
- #define FUNC_NAME s_scm_current_output_port
- {
- if (scm_is_true (cur_outport_fluid))
- return scm_fluid_ref (cur_outport_fluid);
- else
- return SCM_BOOL_F;
- }
- #undef FUNC_NAME
- SCM_DEFINE (scm_current_error_port, "current-error-port", 0, 0, 0,
- (void),
- "Return the port to which errors and warnings should be sent (the\n"
- "@dfn{standard error} in Unix and C terminology).")
- #define FUNC_NAME s_scm_current_error_port
- {
- if (scm_is_true (cur_errport_fluid))
- return scm_fluid_ref (cur_errport_fluid);
- else
- return SCM_BOOL_F;
- }
- #undef FUNC_NAME
- SCM_DEFINE (scm_current_warning_port, "current-warning-port", 0, 0, 0,
- (void),
- "Return the port to which diagnostic warnings should be sent.")
- #define FUNC_NAME s_scm_current_warning_port
- {
- if (scm_is_true (cur_warnport_fluid))
- return scm_fluid_ref (cur_warnport_fluid);
- else
- return SCM_BOOL_F;
- }
- #undef FUNC_NAME
- SCM_DEFINE (scm_current_load_port, "current-load-port", 0, 0, 0,
- (),
- "Return the current-load-port.\n"
- "The load port is used internally by @code{primitive-load}.")
- #define FUNC_NAME s_scm_current_load_port
- {
- return scm_fluid_ref (cur_loadport_fluid);
- }
- #undef FUNC_NAME
- SCM_DEFINE (scm_set_current_input_port, "set-current-input-port", 1, 0, 0,
- (SCM port),
- "@deffnx {Scheme Procedure} set-current-output-port port\n"
- "@deffnx {Scheme Procedure} set-current-error-port port\n"
- "Change the ports returned by @code{current-input-port},\n"
- "@code{current-output-port} and @code{current-error-port}, respectively,\n"
- "so that they use the supplied @var{port} for input or output.")
- #define FUNC_NAME s_scm_set_current_input_port
- {
- SCM oinp = scm_fluid_ref (cur_inport_fluid);
- SCM_VALIDATE_OPINPORT (1, port);
- scm_fluid_set_x (cur_inport_fluid, port);
- return oinp;
- }
- #undef FUNC_NAME
- SCM_DEFINE (scm_set_current_output_port, "set-current-output-port", 1, 0, 0,
- (SCM port),
- "Set the current default output port to @var{port}.")
- #define FUNC_NAME s_scm_set_current_output_port
- {
- SCM ooutp = scm_fluid_ref (cur_outport_fluid);
- port = SCM_COERCE_OUTPORT (port);
- SCM_VALIDATE_OPOUTPORT (1, port);
- scm_fluid_set_x (cur_outport_fluid, port);
- return ooutp;
- }
- #undef FUNC_NAME
- SCM_DEFINE (scm_set_current_error_port, "set-current-error-port", 1, 0, 0,
- (SCM port),
- "Set the current default error port to @var{port}.")
- #define FUNC_NAME s_scm_set_current_error_port
- {
- SCM oerrp = scm_fluid_ref (cur_errport_fluid);
- port = SCM_COERCE_OUTPORT (port);
- SCM_VALIDATE_OPOUTPORT (1, port);
- scm_fluid_set_x (cur_errport_fluid, port);
- return oerrp;
- }
- #undef FUNC_NAME
- SCM
- scm_set_current_warning_port (SCM port)
- #define FUNC_NAME "set-current-warning-port"
- {
- SCM owarnp = scm_fluid_ref (cur_warnport_fluid);
- port = SCM_COERCE_OUTPORT (port);
- SCM_VALIDATE_OPOUTPORT (1, port);
- scm_fluid_set_x (cur_warnport_fluid, port);
- return owarnp;
- }
- #undef FUNC_NAME
- void
- scm_dynwind_current_input_port (SCM port)
- #define FUNC_NAME NULL
- {
- SCM_VALIDATE_OPINPORT (1, port);
- scm_dynwind_fluid (cur_inport_fluid, port);
- }
- #undef FUNC_NAME
- void
- scm_dynwind_current_output_port (SCM port)
- #define FUNC_NAME NULL
- {
- port = SCM_COERCE_OUTPORT (port);
- SCM_VALIDATE_OPOUTPORT (1, port);
- scm_dynwind_fluid (cur_outport_fluid, port);
- }
- #undef FUNC_NAME
- void
- scm_dynwind_current_error_port (SCM port)
- #define FUNC_NAME NULL
- {
- port = SCM_COERCE_OUTPORT (port);
- SCM_VALIDATE_OPOUTPORT (1, port);
- scm_dynwind_fluid (cur_errport_fluid, port);
- }
- #undef FUNC_NAME
- void
- scm_i_dynwind_current_load_port (SCM port)
- {
- scm_dynwind_fluid (cur_loadport_fluid, port);
- }
- /* Retrieving a port's mode. */
- /* Return the flags that characterize a port based on the mode
- * string used to open a file for that port.
- *
- * See PORT FLAGS in scm.h
- */
- static long
- scm_i_mode_bits_n (SCM modes)
- {
- return (SCM_OPN
- | (scm_i_string_contains_char (modes, 'r')
- || scm_i_string_contains_char (modes, '+') ? SCM_RDNG : 0)
- | (scm_i_string_contains_char (modes, 'w')
- || scm_i_string_contains_char (modes, 'a')
- || scm_i_string_contains_char (modes, '+') ? SCM_WRTNG : 0)
- | (scm_i_string_contains_char (modes, '0') ? SCM_BUF0 : 0)
- | (scm_i_string_contains_char (modes, 'l') ? SCM_BUFLINE : 0));
- }
- long
- scm_mode_bits (char *modes)
- {
- /* Valid characters are rw+a0l. So, use latin1. */
- return scm_i_mode_bits (scm_from_latin1_string (modes));
- }
- long
- scm_i_mode_bits (SCM modes)
- {
- long bits;
- if (!scm_is_string (modes))
- scm_wrong_type_arg_msg (NULL, 0, modes, "string");
- bits = scm_i_mode_bits_n (modes);
- scm_remember_upto_here_1 (modes);
- return bits;
- }
- /* Return the mode flags from an open port.
- * Some modes such as "append" are only used when opening
- * a file and are not returned here. */
- SCM_DEFINE (scm_port_mode, "port-mode", 1, 0, 0,
- (SCM port),
- "Return the port modes associated with the open port @var{port}.\n"
- "These will not necessarily be identical to the modes used when\n"
- "the port was opened, since modes such as \"append\" which are\n"
- "used only during port creation are not retained.")
- #define FUNC_NAME s_scm_port_mode
- {
- char modes[4];
- modes[0] = '\0';
- port = SCM_COERCE_OUTPORT (port);
- SCM_VALIDATE_OPPORT (1, port);
- if (SCM_CELL_WORD_0 (port) & SCM_RDNG) {
- if (SCM_CELL_WORD_0 (port) & SCM_WRTNG)
- strcpy (modes, "r+");
- else
- strcpy (modes, "r");
- }
- else if (SCM_CELL_WORD_0 (port) & SCM_WRTNG)
- strcpy (modes, "w");
- if (SCM_CELL_WORD_0 (port) & SCM_BUF0)
- strcat (modes, "0");
- return scm_from_latin1_string (modes);
- }
- #undef FUNC_NAME
- /* The port table --- a weak set of all ports.
- We need a global registry of ports to flush them all at exit, and to
- get all the ports matching a file descriptor. */
- SCM scm_i_port_weak_set;
- /* Port finalization. */
- struct do_free_data
- {
- scm_t_ptob_descriptor *ptob;
- SCM port;
- };
- static SCM
- do_free (void *body_data)
- {
- struct do_free_data *data = body_data;
- /* `close' is for explicit `close-port' by user. `free' is for this
- purpose: ports collected by the GC. */
- data->ptob->free (data->port);
- return SCM_BOOL_T;
- }
- /* Finalize the object (a port) pointed to by PTR. */
- static void
- finalize_port (void *ptr, void *data)
- {
- SCM port = SCM_PACK_POINTER (ptr);
- if (!SCM_PORTP (port))
- abort ();
- if (SCM_OPENP (port))
- {
- struct do_free_data data;
- SCM_CLR_PORT_OPEN_FLAG (port);
- data.ptob = SCM_PORT_DESCRIPTOR (port);
- data.port = port;
- scm_internal_catch (SCM_BOOL_T, do_free, &data,
- scm_handle_by_message_noexit, NULL);
- scm_gc_ports_collected++;
- }
- }
- SCM
- scm_c_make_port_with_encoding (scm_t_bits tag, unsigned long mode_bits,
- const char *encoding,
- scm_t_string_failed_conversion_handler handler,
- scm_t_bits stream)
- {
- SCM ret;
- scm_t_port *entry;
- scm_t_port_internal *pti;
- scm_t_ptob_descriptor *ptob;
- entry = scm_gc_typed_calloc (scm_t_port);
- pti = scm_gc_typed_calloc (scm_t_port_internal);
- ptob = scm_c_port_type_ref (SCM_TC2PTOBNUM (tag));
- ret = scm_words (tag | mode_bits, 3);
- SCM_SET_CELL_WORD_1 (ret, (scm_t_bits) entry);
- SCM_SET_CELL_WORD_2 (ret, (scm_t_bits) ptob);
- entry->lock = scm_gc_malloc_pointerless (sizeof (*entry->lock), "port lock");
- scm_i_pthread_mutex_init (entry->lock, scm_i_pthread_mutexattr_recursive);
- entry->internal = pti;
- entry->file_name = SCM_BOOL_F;
- entry->rw_active = SCM_PORT_NEITHER;
- entry->port = ret;
- entry->stream = stream;
- if (encoding_matches (encoding, "UTF-8"))
- {
- pti->encoding_mode = SCM_PORT_ENCODING_MODE_UTF8;
- entry->encoding = "UTF-8";
- }
- else if (encoding_matches (encoding, "ISO-8859-1"))
- {
- pti->encoding_mode = SCM_PORT_ENCODING_MODE_LATIN1;
- entry->encoding = "ISO-8859-1";
- }
- else
- {
- pti->encoding_mode = SCM_PORT_ENCODING_MODE_ICONV;
- entry->encoding = canonicalize_encoding (encoding);
- }
- entry->ilseq_handler = handler;
- pti->iconv_descriptors = NULL;
- pti->at_stream_start_for_bom_read = 1;
- pti->at_stream_start_for_bom_write = 1;
- pti->pending_eof = 0;
- pti->alist = SCM_EOL;
- if (SCM_PORT_DESCRIPTOR (ret)->free)
- scm_i_set_finalizer (SCM2PTR (ret), finalize_port, NULL);
- if (SCM_PORT_DESCRIPTOR (ret)->flags & SCM_PORT_TYPE_HAS_FLUSH)
- scm_weak_set_add_x (scm_i_port_weak_set, ret);
- return ret;
- }
- SCM
- scm_c_make_port (scm_t_bits tag, unsigned long mode_bits, scm_t_bits stream)
- {
- return scm_c_make_port_with_encoding (tag, mode_bits,
- scm_i_default_port_encoding (),
- scm_i_default_port_conversion_handler (),
- stream);
- }
- SCM
- scm_new_port_table_entry (scm_t_bits tag)
- {
- return scm_c_make_port (tag, 0, 0);
- }
- /* Predicates. */
- SCM_DEFINE (scm_port_p, "port?", 1, 0, 0,
- (SCM x),
- "Return a boolean indicating whether @var{x} is a port.\n"
- "Equivalent to @code{(or (input-port? @var{x}) (output-port?\n"
- "@var{x}))}.")
- #define FUNC_NAME s_scm_port_p
- {
- return scm_from_bool (SCM_PORTP (x));
- }
- #undef FUNC_NAME
- SCM_DEFINE (scm_input_port_p, "input-port?", 1, 0, 0,
- (SCM x),
- "Return @code{#t} if @var{x} is an input port, otherwise return\n"
- "@code{#f}. Any object satisfying this predicate also satisfies\n"
- "@code{port?}.")
- #define FUNC_NAME s_scm_input_port_p
- {
- return scm_from_bool (SCM_INPUT_PORT_P (x));
- }
- #undef FUNC_NAME
- SCM_DEFINE (scm_output_port_p, "output-port?", 1, 0, 0,
- (SCM x),
- "Return @code{#t} if @var{x} is an output port, otherwise return\n"
- "@code{#f}. Any object satisfying this predicate also satisfies\n"
- "@code{port?}.")
- #define FUNC_NAME s_scm_output_port_p
- {
- x = SCM_COERCE_OUTPORT (x);
- return scm_from_bool (SCM_OUTPUT_PORT_P (x));
- }
- #undef FUNC_NAME
- SCM_DEFINE (scm_port_closed_p, "port-closed?", 1, 0, 0,
- (SCM port),
- "Return @code{#t} if @var{port} is closed or @code{#f} if it is\n"
- "open.")
- #define FUNC_NAME s_scm_port_closed_p
- {
- SCM_VALIDATE_PORT (1, port);
- return scm_from_bool (!SCM_OPPORTP (port));
- }
- #undef FUNC_NAME
- SCM_DEFINE (scm_eof_object_p, "eof-object?", 1, 0, 0,
- (SCM x),
- "Return @code{#t} if @var{x} is an end-of-file object; otherwise\n"
- "return @code{#f}.")
- #define FUNC_NAME s_scm_eof_object_p
- {
- return scm_from_bool (SCM_EOF_OBJECT_P (x));
- }
- #undef FUNC_NAME
- /* Closing ports. */
- static void close_iconv_descriptors (scm_t_iconv_descriptors *id);
- /* scm_close_port
- * Call the close operation on a port object.
- * see also scm_close.
- */
- SCM_DEFINE (scm_close_port, "close-port", 1, 0, 0,
- (SCM port),
- "Close the specified port object. Return @code{#t} if it\n"
- "successfully closes a port or @code{#f} if it was already\n"
- "closed. An exception may be raised if an error occurs, for\n"
- "example when flushing buffered output. See also @ref{Ports and\n"
- "File Descriptors, close}, for a procedure which can close file\n"
- "descriptors.")
- #define FUNC_NAME s_scm_close_port
- {
- scm_t_port_internal *pti;
- int rv;
- port = SCM_COERCE_OUTPORT (port);
- SCM_VALIDATE_PORT (1, port);
- if (SCM_CLOSEDP (port))
- return SCM_BOOL_F;
- pti = SCM_PORT_GET_INTERNAL (port);
- SCM_CLR_PORT_OPEN_FLAG (port);
- if (SCM_PORT_DESCRIPTOR (port)->flags & SCM_PORT_TYPE_HAS_FLUSH)
- scm_weak_set_remove_x (scm_i_port_weak_set, port);
- if (SCM_PORT_DESCRIPTOR (port)->close)
- /* Note! This may throw an exception. Anything after this point
- should be resilient to non-local exits. */
- rv = SCM_PORT_DESCRIPTOR (port)->close (port);
- else
- rv = 0;
- if (pti->iconv_descriptors)
- {
- /* If we don't get here, the iconv_descriptors finalizer will
- clean up. */
- close_iconv_descriptors (pti->iconv_descriptors);
- pti->iconv_descriptors = NULL;
- }
- return scm_from_bool (rv >= 0);
- }
- #undef FUNC_NAME
- SCM_DEFINE (scm_close_input_port, "close-input-port", 1, 0, 0,
- (SCM port),
- "Close the specified input port object. The routine has no effect if\n"
- "the file has already been closed. An exception may be raised if an\n"
- "error occurs. The value returned is unspecified.\n\n"
- "See also @ref{Ports and File Descriptors, close}, for a procedure\n"
- "which can close file descriptors.")
- #define FUNC_NAME s_scm_close_input_port
- {
- SCM_VALIDATE_INPUT_PORT (1, port);
- scm_close_port (port);
- return SCM_UNSPECIFIED;
- }
- #undef FUNC_NAME
- SCM_DEFINE (scm_close_output_port, "close-output-port", 1, 0, 0,
- (SCM port),
- "Close the specified output port object. The routine has no effect if\n"
- "the file has already been closed. An exception may be raised if an\n"
- "error occurs. The value returned is unspecified.\n\n"
- "See also @ref{Ports and File Descriptors, close}, for a procedure\n"
- "which can close file descriptors.")
- #define FUNC_NAME s_scm_close_output_port
- {
- port = SCM_COERCE_OUTPORT (port);
- SCM_VALIDATE_OUTPUT_PORT (1, port);
- scm_close_port (port);
- return SCM_UNSPECIFIED;
- }
- #undef FUNC_NAME
- /* Encoding characters to byte streams, and decoding byte streams to
- characters. */
- /* A fluid specifying the default encoding for newly created ports. If it is
- a string, that is the encoding. If it is #f, it is in the "native"
- (Latin-1) encoding. */
- SCM_VARIABLE (default_port_encoding_var, "%default-port-encoding");
- static int scm_port_encoding_init = 0;
- /* Use ENCODING as the default encoding for future ports. */
- void
- scm_i_set_default_port_encoding (const char *encoding)
- {
- if (!scm_port_encoding_init
- || !scm_is_fluid (SCM_VARIABLE_REF (default_port_encoding_var)))
- scm_misc_error (NULL, "tried to set port encoding fluid before it is initialized",
- SCM_EOL);
- if (encoding_matches (encoding, "ISO-8859-1"))
- scm_fluid_set_x (SCM_VARIABLE_REF (default_port_encoding_var), SCM_BOOL_F);
- else
- scm_fluid_set_x (SCM_VARIABLE_REF (default_port_encoding_var),
- scm_from_latin1_string (canonicalize_encoding (encoding)));
- }
- /* Return the name of the default encoding for newly created ports. */
- const char *
- scm_i_default_port_encoding (void)
- {
- if (!scm_port_encoding_init)
- return "ISO-8859-1";
- else if (!scm_is_fluid (SCM_VARIABLE_REF (default_port_encoding_var)))
- return "ISO-8859-1";
- else
- {
- SCM encoding;
- encoding = scm_fluid_ref (SCM_VARIABLE_REF (default_port_encoding_var));
- if (!scm_is_string (encoding))
- return "ISO-8859-1";
- else
- return scm_i_string_chars (encoding);
- }
- }
- /* A fluid specifying the default conversion handler for newly created
- ports. Its value should be one of the symbols below. */
- SCM_VARIABLE (default_conversion_strategy_var,
- "%default-port-conversion-strategy");
- /* Whether the above fluid is initialized. */
- static int scm_conversion_strategy_init = 0;
- /* The possible conversion strategies. */
- SCM_SYMBOL (sym_error, "error");
- SCM_SYMBOL (sym_substitute, "substitute");
- SCM_SYMBOL (sym_escape, "escape");
- /* Return the default failed encoding conversion policy for new created
- ports. */
- scm_t_string_failed_conversion_handler
- scm_i_default_port_conversion_handler (void)
- {
- scm_t_string_failed_conversion_handler handler;
- if (!scm_conversion_strategy_init
- || !scm_is_fluid (SCM_VARIABLE_REF (default_conversion_strategy_var)))
- handler = SCM_FAILED_CONVERSION_QUESTION_MARK;
- else
- {
- SCM fluid, value;
- fluid = SCM_VARIABLE_REF (default_conversion_strategy_var);
- value = scm_fluid_ref (fluid);
- if (scm_is_eq (sym_substitute, value))
- handler = SCM_FAILED_CONVERSION_QUESTION_MARK;
- else if (scm_is_eq (sym_escape, value))
- handler = SCM_FAILED_CONVERSION_ESCAPE_SEQUENCE;
- else
- /* Default to 'error also when the fluid's value is not one of
- the valid symbols. */
- handler = SCM_FAILED_CONVERSION_ERROR;
- }
- return handler;
- }
- /* Use HANDLER as the default conversion strategy for future ports. */
- void
- scm_i_set_default_port_conversion_handler (scm_t_string_failed_conversion_handler
- handler)
- {
- SCM strategy;
- if (!scm_conversion_strategy_init
- || !scm_is_fluid (SCM_VARIABLE_REF (default_conversion_strategy_var)))
- scm_misc_error (NULL, "tried to set conversion strategy fluid before it is initialized",
- SCM_EOL);
- switch (handler)
- {
- case SCM_FAILED_CONVERSION_ERROR:
- strategy = sym_error;
- break;
- case SCM_FAILED_CONVERSION_ESCAPE_SEQUENCE:
- strategy = sym_escape;
- break;
- case SCM_FAILED_CONVERSION_QUESTION_MARK:
- strategy = sym_substitute;
- break;
- default:
- abort ();
- }
- scm_fluid_set_x (SCM_VARIABLE_REF (default_conversion_strategy_var),
- strategy);
- }
- static void
- scm_i_unget_bytes_unlocked (const unsigned char *buf, size_t len, SCM port);
- /* If the next LEN bytes from PORT are equal to those in BYTES, then
- return 1, else return 0. Leave the port position unchanged. */
- static int
- looking_at_bytes (SCM port, const unsigned char *bytes, int len)
- {
- scm_t_port *pt = SCM_PTAB_ENTRY (port);
- int i = 0;
- while (i < len && scm_peek_byte_or_eof_unlocked (port) == bytes[i])
- {
- pt->read_pos++;
- i++;
- }
- scm_i_unget_bytes_unlocked (bytes, i, port);
- return (i == len);
- }
/* Byte sequences of the byte-order mark in the UTF-8, UTF-16 and
   UTF-32 encodings (big- and little-endian variants).  */
static const unsigned char scm_utf8_bom[3]    = { 0xEF, 0xBB, 0xBF };
static const unsigned char scm_utf16be_bom[2] = { 0xFE, 0xFF };
static const unsigned char scm_utf16le_bom[2] = { 0xFF, 0xFE };
static const unsigned char scm_utf32be_bom[4] = { 0x00, 0x00, 0xFE, 0xFF };
static const unsigned char scm_utf32le_bom[4] = { 0xFF, 0xFE, 0x00, 0x00 };
- /* Decide what byte order to use for a UTF-16 port. Return "UTF-16BE"
- or "UTF-16LE". MODE must be either SCM_PORT_READ or SCM_PORT_WRITE,
- and specifies which operation is about to be done. The MODE
- determines how we will decide the byte order. We deliberately avoid
- reading from the port unless the user is about to do so. If the user
- is about to read, then we look for a BOM, and if present, we use it
- to determine the byte order. Otherwise we choose big endian, as
- recommended by the Unicode Standard. Note that the BOM (if any) is
- not consumed here. */
- static const char *
- decide_utf16_encoding (SCM port, scm_t_port_rw_active mode)
- {
- if (mode == SCM_PORT_READ
- && SCM_PORT_GET_INTERNAL (port)->at_stream_start_for_bom_read
- && looking_at_bytes (port, scm_utf16le_bom, sizeof scm_utf16le_bom))
- return "UTF-16LE";
- else
- return "UTF-16BE";
- }
- /* Decide what byte order to use for a UTF-32 port. Return "UTF-32BE"
- or "UTF-32LE". See the comment above 'decide_utf16_encoding' for
- details. */
- static const char *
- decide_utf32_encoding (SCM port, scm_t_port_rw_active mode)
- {
- if (mode == SCM_PORT_READ
- && SCM_PORT_GET_INTERNAL (port)->at_stream_start_for_bom_read
- && looking_at_bytes (port, scm_utf32le_bom, sizeof scm_utf32le_bom))
- return "UTF-32LE";
- else
- return "UTF-32BE";
- }
- static void
- finalize_iconv_descriptors (void *ptr, void *data)
- {
- close_iconv_descriptors (ptr);
- }
- static scm_t_iconv_descriptors *
- open_iconv_descriptors (const char *encoding, int reading, int writing)
- {
- scm_t_iconv_descriptors *id;
- iconv_t input_cd, output_cd;
- size_t i;
- input_cd = (iconv_t) -1;
- output_cd = (iconv_t) -1;
- for (i = 0; encoding[i]; i++)
- if (encoding[i] > 127)
- goto invalid_encoding;
- if (reading)
- {
- /* Open an input iconv conversion descriptor, from ENCODING
- to UTF-8. We choose UTF-8, not UTF-32, because iconv
- implementations can typically convert from anything to
- UTF-8, but not to UTF-32 (see
- <http://lists.gnu.org/archive/html/bug-libunistring/2010-09/msg00007.html>). */
- /* Assume opening an iconv descriptor causes about 16 KB of
- allocation. */
- scm_gc_register_allocation (16 * 1024);
- input_cd = iconv_open ("UTF-8", encoding);
- if (input_cd == (iconv_t) -1)
- goto invalid_encoding;
- }
- if (writing)
- {
- /* Assume opening an iconv descriptor causes about 16 KB of
- allocation. */
- scm_gc_register_allocation (16 * 1024);
- output_cd = iconv_open (encoding, "UTF-8");
- if (output_cd == (iconv_t) -1)
- {
- if (input_cd != (iconv_t) -1)
- iconv_close (input_cd);
- goto invalid_encoding;
- }
- }
- id = scm_gc_malloc_pointerless (sizeof (*id), "iconv descriptors");
- id->input_cd = input_cd;
- id->output_cd = output_cd;
- /* Register a finalizer to close the descriptors. */
- scm_i_set_finalizer (id, finalize_iconv_descriptors, NULL);
- return id;
- invalid_encoding:
- {
- SCM err;
- err = scm_from_latin1_string (encoding);
- scm_misc_error ("open_iconv_descriptors",
- "invalid or unknown character encoding ~s",
- scm_list_1 (err));
- }
- }
- static void
- close_iconv_descriptors (scm_t_iconv_descriptors *id)
- {
- if (id->input_cd != (iconv_t) -1)
- iconv_close (id->input_cd);
- if (id->output_cd != (iconv_t) -1)
- iconv_close (id->output_cd);
- id->input_cd = (void *) -1;
- id->output_cd = (void *) -1;
- }
- scm_t_iconv_descriptors *
- scm_i_port_iconv_descriptors (SCM port, scm_t_port_rw_active mode)
- {
- scm_t_port_internal *pti = SCM_PORT_GET_INTERNAL (port);
- assert (pti->encoding_mode == SCM_PORT_ENCODING_MODE_ICONV);
- if (!pti->iconv_descriptors)
- {
- scm_t_port *pt = SCM_PTAB_ENTRY (port);
- const char *precise_encoding;
- if (!pt->encoding)
- pt->encoding = "ISO-8859-1";
- /* If the specified encoding is UTF-16 or UTF-32, then make
- that more precise by deciding what byte order to use. */
- if (strcmp (pt->encoding, "UTF-16") == 0)
- precise_encoding = decide_utf16_encoding (port, mode);
- else if (strcmp (pt->encoding, "UTF-32") == 0)
- precise_encoding = decide_utf32_encoding (port, mode);
- else
- precise_encoding = pt->encoding;
- pti->iconv_descriptors =
- open_iconv_descriptors (precise_encoding,
- SCM_INPUT_PORT_P (port),
- SCM_OUTPUT_PORT_P (port));
- }
- return pti->iconv_descriptors;
- }
- /* The name of the encoding is itself encoded in ASCII. */
- void
- scm_i_set_port_encoding_x (SCM port, const char *encoding)
- {
- scm_t_port *pt;
- scm_t_port_internal *pti;
- scm_t_iconv_descriptors *prev;
- /* Set the character encoding for this port. */
- pt = SCM_PTAB_ENTRY (port);
- pti = SCM_PORT_GET_INTERNAL (port);
- prev = pti->iconv_descriptors;
- /* In order to handle cases where the encoding changes mid-stream
- (e.g. within an HTTP stream, or within a file that is composed of
- segments with different encodings), we consider this to be "stream
- start" for purposes of BOM handling, regardless of our actual file
- position. */
- pti->at_stream_start_for_bom_read = 1;
- pti->at_stream_start_for_bom_write = 1;
- if (encoding_matches (encoding, "UTF-8"))
- {
- pt->encoding = "UTF-8";
- pti->encoding_mode = SCM_PORT_ENCODING_MODE_UTF8;
- }
- else if (encoding_matches (encoding, "ISO-8859-1"))
- {
- pt->encoding = "ISO-8859-1";
- pti->encoding_mode = SCM_PORT_ENCODING_MODE_LATIN1;
- }
- else
- {
- pt->encoding = canonicalize_encoding (encoding);
- pti->encoding_mode = SCM_PORT_ENCODING_MODE_ICONV;
- }
- pti->iconv_descriptors = NULL;
- if (prev)
- close_iconv_descriptors (prev);
- }
- SCM_DEFINE (scm_port_encoding, "port-encoding", 1, 0, 0,
- (SCM port),
- "Returns, as a string, the character encoding that @var{port}\n"
- "uses to interpret its input and output.\n")
- #define FUNC_NAME s_scm_port_encoding
- {
- SCM_VALIDATE_PORT (1, port);
- return scm_from_latin1_string (SCM_PTAB_ENTRY (port)->encoding);
- }
- #undef FUNC_NAME
- SCM_DEFINE (scm_set_port_encoding_x, "set-port-encoding!", 2, 0, 0,
- (SCM port, SCM enc),
- "Sets the character encoding that will be used to interpret all\n"
- "port I/O. New ports are created with the encoding\n"
- "appropriate for the current locale if @code{setlocale} has \n"
- "been called or ISO-8859-1 otherwise\n"
- "and this procedure can be used to modify that encoding.\n")
- #define FUNC_NAME s_scm_set_port_encoding_x
- {
- char *enc_str;
- SCM_VALIDATE_PORT (1, port);
- SCM_VALIDATE_STRING (2, enc);
- enc_str = scm_to_latin1_string (enc);
- scm_i_set_port_encoding_x (port, enc_str);
- free (enc_str);
- return SCM_UNSPECIFIED;
- }
- #undef FUNC_NAME
- SCM_DEFINE (scm_port_conversion_strategy, "port-conversion-strategy",
- 1, 0, 0, (SCM port),
- "Returns the behavior of the port when handling a character that\n"
- "is not representable in the port's current encoding.\n"
- "It returns the symbol @code{error} if unrepresentable characters\n"
- "should cause exceptions, @code{substitute} if the port should\n"
- "try to replace unrepresentable characters with question marks or\n"
- "approximate characters, or @code{escape} if unrepresentable\n"
- "characters should be converted to string escapes.\n"
- "\n"
- "If @var{port} is @code{#f}, then the current default behavior\n"
- "will be returned. New ports will have this default behavior\n"
- "when they are created.\n")
- #define FUNC_NAME s_scm_port_conversion_strategy
- {
- scm_t_string_failed_conversion_handler h;
- if (scm_is_false (port))
- h = scm_i_default_port_conversion_handler ();
- else
- {
- scm_t_port *pt;
- SCM_VALIDATE_OPPORT (1, port);
- pt = SCM_PTAB_ENTRY (port);
- h = pt->ilseq_handler;
- }
- if (h == SCM_FAILED_CONVERSION_ERROR)
- return scm_from_latin1_symbol ("error");
- else if (h == SCM_FAILED_CONVERSION_QUESTION_MARK)
- return scm_from_latin1_symbol ("substitute");
- else if (h == SCM_FAILED_CONVERSION_ESCAPE_SEQUENCE)
- return scm_from_latin1_symbol ("escape");
- else
- abort ();
- /* Never gets here. */
- return SCM_UNDEFINED;
- }
- #undef FUNC_NAME
- SCM_DEFINE (scm_set_port_conversion_strategy_x, "set-port-conversion-strategy!",
- 2, 0, 0,
- (SCM port, SCM sym),
- "Sets the behavior of the interpreter when outputting a character\n"
- "that is not representable in the port's current encoding.\n"
- "@var{sym} can be either @code{'error}, @code{'substitute}, or\n"
- "@code{'escape}. If it is @code{'error}, an error will be thrown\n"
- "when an unconvertible character is encountered. If it is\n"
- "@code{'substitute}, then unconvertible characters will \n"
- "be replaced with approximate characters, or with question marks\n"
- "if no approximately correct character is available.\n"
- "If it is @code{'escape},\n"
- "it will appear as a hex escape when output.\n"
- "\n"
- "If @var{port} is an open port, the conversion error behavior\n"
- "is set for that port. If it is @code{#f}, it is set as the\n"
- "default behavior for any future ports that get created in\n"
- "this thread.\n")
- #define FUNC_NAME s_scm_set_port_conversion_strategy_x
- {
- scm_t_string_failed_conversion_handler handler;
- if (scm_is_eq (sym, sym_error))
- handler = SCM_FAILED_CONVERSION_ERROR;
- else if (scm_is_eq (sym, sym_substitute))
- handler = SCM_FAILED_CONVERSION_QUESTION_MARK;
- else if (scm_is_eq (sym, sym_escape))
- handler = SCM_FAILED_CONVERSION_ESCAPE_SEQUENCE;
- else
- SCM_MISC_ERROR ("unknown conversion strategy ~s", scm_list_1 (sym));
- if (scm_is_false (port))
- scm_i_set_default_port_conversion_handler (handler);
- else
- {
- SCM_VALIDATE_OPPORT (1, port);
- SCM_PTAB_ENTRY (port)->ilseq_handler = handler;
- }
- return SCM_UNSPECIFIED;
- }
- #undef FUNC_NAME
- /* The port lock. */
- static void
- lock_port (void *mutex)
- {
- scm_i_pthread_mutex_lock ((scm_i_pthread_mutex_t *) mutex);
- }
- static void
- unlock_port (void *mutex)
- {
- scm_i_pthread_mutex_unlock ((scm_i_pthread_mutex_t *) mutex);
- }
- void
- scm_dynwind_lock_port (SCM port)
- #define FUNC_NAME "dynwind-lock-port"
- {
- scm_i_pthread_mutex_t *lock;
- SCM_VALIDATE_OPPORT (SCM_ARG1, port);
- scm_c_lock_port (port, &lock);
- if (lock)
- {
- scm_dynwind_unwind_handler (unlock_port, lock, SCM_F_WIND_EXPLICITLY);
- scm_dynwind_rewind_handler (lock_port, lock, 0);
- }
- }
- #undef FUNC_NAME
- /* Input. */
- int
- scm_get_byte_or_eof (SCM port)
- {
- scm_i_pthread_mutex_t *lock;
- int ret;
- scm_c_lock_port (port, &lock);
- ret = scm_get_byte_or_eof_unlocked (port);
- if (lock)
- scm_i_pthread_mutex_unlock (lock);
- return ret;
- }
- int
- scm_peek_byte_or_eof (SCM port)
- {
- scm_i_pthread_mutex_t *lock;
- int ret;
- scm_c_lock_port (port, &lock);
- ret = scm_peek_byte_or_eof_unlocked (port);
- if (lock)
- scm_i_pthread_mutex_unlock (lock);
- return ret;
- }
- /* scm_c_read
- *
- * Used by an application to read arbitrary number of bytes from an
- * SCM port. Same semantics as libc read, except that scm_c_read only
- * returns less than SIZE bytes if at end-of-file.
- *
- * Warning: Doesn't update port line and column counts! */
- /* This structure, and the following swap_buffer function, are used
- for temporarily swapping a port's own read buffer, and the buffer
- that the caller of scm_c_read provides. */
- struct port_and_swap_buffer
- {
- scm_t_port *pt;
- unsigned char *buffer;
- size_t size;
- };
- static void
- swap_buffer (void *data)
- {
- struct port_and_swap_buffer *psb = (struct port_and_swap_buffer *) data;
- unsigned char *old_buf = psb->pt->read_buf;
- size_t old_size = psb->pt->read_buf_size;
- /* Make the port use (buffer, size) from the struct. */
- psb->pt->read_pos = psb->pt->read_buf = psb->pt->read_end = psb->buffer;
- psb->pt->read_buf_size = psb->size;
- /* Save the port's old (buffer, size) in the struct. */
- psb->buffer = old_buf;
- psb->size = old_size;
- }
- static int scm_i_fill_input_unlocked (SCM port);
- size_t
- scm_c_read_unlocked (SCM port, void *buffer, size_t size)
- #define FUNC_NAME "scm_c_read"
- {
- scm_t_port *pt;
- scm_t_port_internal *pti;
- size_t n_read = 0, n_available;
- struct port_and_swap_buffer psb;
- SCM_VALIDATE_OPINPORT (1, port);
- pt = SCM_PTAB_ENTRY (port);
- pti = SCM_PORT_GET_INTERNAL (port);
- if (pt->rw_active == SCM_PORT_WRITE)
- SCM_PORT_DESCRIPTOR (port)->flush (port);
- if (pt->rw_random)
- pt->rw_active = SCM_PORT_READ;
- /* Take bytes first from the port's read buffer. */
- if (pt->read_pos < pt->read_end)
- {
- n_available = min (size, pt->read_end - pt->read_pos);
- memcpy (buffer, pt->read_pos, n_available);
- buffer = (char *) buffer + n_available;
- pt->read_pos += n_available;
- n_read += n_available;
- size -= n_available;
- }
- /* Avoid the scm_dynwind_* costs if we now have enough data. */
- if (size == 0)
- return n_read;
- /* Now we will call scm_i_fill_input_unlocked repeatedly until we have
- read the requested number of bytes. (Note that a single
- scm_i_fill_input_unlocked call does not guarantee to fill the whole
- of the port's read buffer.) */
- if (pt->read_buf_size <= 1
- && pti->encoding_mode == SCM_PORT_ENCODING_MODE_LATIN1)
- {
- /* The port that we are reading from is unbuffered - i.e. does not
- have its own persistent buffer - but we have a buffer, provided
- by our caller, that is the right size for the data that is
- wanted. For the following scm_i_fill_input_unlocked calls,
- therefore, we use the buffer in hand as the port's read buffer.
- We need to make sure that the port's normal (1 byte) buffer is
- reinstated in case one of the scm_i_fill_input_unlocked ()
- calls throws an exception; we use the scm_dynwind_* API to
- achieve that.
- A consequence of this optimization is that the fill_input
- functions can't unget characters. That'll push data to the
- pushback buffer instead of this psb buffer. */
- #if SCM_DEBUG == 1
- unsigned char *pback = pt->putback_buf;
- #endif
- psb.pt = pt;
- psb.buffer = buffer;
- psb.size = size;
- scm_dynwind_begin (SCM_F_DYNWIND_REWINDABLE);
- scm_dynwind_rewind_handler (swap_buffer, &psb, SCM_F_WIND_EXPLICITLY);
- scm_dynwind_unwind_handler (swap_buffer, &psb, SCM_F_WIND_EXPLICITLY);
- /* Call scm_i_fill_input_unlocked until we have all the bytes that
- we need, or we hit EOF. */
- while (pt->read_buf_size && (scm_i_fill_input_unlocked (port) != EOF))
- {
- pt->read_buf_size -= (pt->read_end - pt->read_pos);
- pt->read_pos = pt->read_buf = pt->read_end;
- }
- #if SCM_DEBUG == 1
- if (pback != pt->putback_buf
- || pt->read_buf - (unsigned char *) buffer < 0)
- scm_misc_error (FUNC_NAME,
- "scm_c_read must not call a fill function that pushes "
- "back characters onto an unbuffered port", SCM_EOL);
- #endif
- n_read += pt->read_buf - (unsigned char *) buffer;
-
- /* Reinstate the port's normal buffer. */
- scm_dynwind_end ();
- }
- else
- {
- /* The port has its own buffer. It is important that we use it,
- even if it happens to be smaller than our caller's buffer, so
- that a custom port implementation's entry points (in
- particular, fill_input) can rely on the buffer always being
- the same as they first set up. */
- while (size && (scm_i_fill_input_unlocked (port) != EOF))
- {
- n_available = min (size, pt->read_end - pt->read_pos);
- memcpy (buffer, pt->read_pos, n_available);
- buffer = (char *) buffer + n_available;
- pt->read_pos += n_available;
- n_read += n_available;
- size -= n_available;
- }
- }
- return n_read;
- }
- #undef FUNC_NAME
- size_t
- scm_c_read (SCM port, void *buffer, size_t size)
- {
- scm_i_pthread_mutex_t *lock;
- size_t ret;
- scm_c_lock_port (port, &lock);
- ret = scm_c_read_unlocked (port, buffer, size);
- if (lock)
- scm_i_pthread_mutex_unlock (lock);
-
- return ret;
- }
- /* Update the line and column number of PORT after consumption of C. */
- static inline void
- update_port_lf (scm_t_wchar c, SCM port)
- {
- switch (c)
- {
- case '\a':
- case EOF:
- break;
- case '\b':
- SCM_DECCOL (port);
- break;
- case '\n':
- SCM_INCLINE (port);
- break;
- case '\r':
- SCM_ZEROCOL (port);
- break;
- case '\t':
- SCM_TABCOL (port);
- break;
- default:
- SCM_INCCOL (port);
- break;
- }
- }
- #define SCM_MBCHAR_BUF_SIZE (4)
- /* Convert the SIZE-byte UTF-8 sequence in UTF8_BUF to a codepoint.
- UTF8_BUF is assumed to contain a valid UTF-8 sequence. */
- static scm_t_wchar
- utf8_to_codepoint (const scm_t_uint8 *utf8_buf, size_t size)
- {
- scm_t_wchar codepoint;
- if (utf8_buf[0] <= 0x7f)
- {
- assert (size == 1);
- codepoint = utf8_buf[0];
- }
- else if ((utf8_buf[0] & 0xe0) == 0xc0)
- {
- assert (size == 2);
- codepoint = ((scm_t_wchar) utf8_buf[0] & 0x1f) << 6UL
- | (utf8_buf[1] & 0x3f);
- }
- else if ((utf8_buf[0] & 0xf0) == 0xe0)
- {
- assert (size == 3);
- codepoint = ((scm_t_wchar) utf8_buf[0] & 0x0f) << 12UL
- | ((scm_t_wchar) utf8_buf[1] & 0x3f) << 6UL
- | (utf8_buf[2] & 0x3f);
- }
- else
- {
- assert (size == 4);
- codepoint = ((scm_t_wchar) utf8_buf[0] & 0x07) << 18UL
- | ((scm_t_wchar) utf8_buf[1] & 0x3f) << 12UL
- | ((scm_t_wchar) utf8_buf[2] & 0x3f) << 6UL
- | (utf8_buf[3] & 0x3f);
- }
- return codepoint;
- }
- /* Read a UTF-8 sequence from PORT. On success, return 0 and set
- *CODEPOINT to the codepoint that was read, fill BUF with its UTF-8
- representation, and set *LEN to the length in bytes. Return
- `EILSEQ' on error. */
- static int
- get_utf8_codepoint (SCM port, scm_t_wchar *codepoint,
- scm_t_uint8 buf[SCM_MBCHAR_BUF_SIZE], size_t *len)
- {
- #define ASSERT_NOT_EOF(b) \
- if (SCM_UNLIKELY ((b) == EOF)) \
- goto invalid_seq
- #define CONSUME_PEEKED_BYTE() \
- pt->read_pos++
- int byte;
- scm_t_port *pt;
- *len = 0;
- pt = SCM_PTAB_ENTRY (port);
- byte = scm_get_byte_or_eof_unlocked (port);
- if (byte == EOF)
- {
- *codepoint = EOF;
- return 0;
- }
- buf[0] = (scm_t_uint8) byte;
- *len = 1;
- if (buf[0] <= 0x7f)
- /* 1-byte form. */
- *codepoint = buf[0];
- else if (buf[0] >= 0xc2 && buf[0] <= 0xdf)
- {
- /* 2-byte form. */
- byte = scm_peek_byte_or_eof_unlocked (port);
- ASSERT_NOT_EOF (byte);
- if (SCM_UNLIKELY ((byte & 0xc0) != 0x80))
- goto invalid_seq;
- CONSUME_PEEKED_BYTE ();
- buf[1] = (scm_t_uint8) byte;
- *len = 2;
- *codepoint = ((scm_t_wchar) buf[0] & 0x1f) << 6UL
- | (buf[1] & 0x3f);
- }
- else if ((buf[0] & 0xf0) == 0xe0)
- {
- /* 3-byte form. */
- byte = scm_peek_byte_or_eof_unlocked (port);
- ASSERT_NOT_EOF (byte);
- if (SCM_UNLIKELY ((byte & 0xc0) != 0x80
- || (buf[0] == 0xe0 && byte < 0xa0)
- || (buf[0] == 0xed && byte > 0x9f)))
- goto invalid_seq;
- CONSUME_PEEKED_BYTE ();
- buf[1] = (scm_t_uint8) byte;
- *len = 2;
- byte = scm_peek_byte_or_eof_unlocked (port);
- ASSERT_NOT_EOF (byte);
- if (SCM_UNLIKELY ((byte & 0xc0) != 0x80))
- goto invalid_seq;
- CONSUME_PEEKED_BYTE ();
- buf[2] = (scm_t_uint8) byte;
- *len = 3;
- *codepoint = ((scm_t_wchar) buf[0] & 0x0f) << 12UL
- | ((scm_t_wchar) buf[1] & 0x3f) << 6UL
- | (buf[2] & 0x3f);
- }
- else if (buf[0] >= 0xf0 && buf[0] <= 0xf4)
- {
- /* 4-byte form. */
- byte = scm_peek_byte_or_eof_unlocked (port);
- ASSERT_NOT_EOF (byte);
- if (SCM_UNLIKELY (((byte & 0xc0) != 0x80)
- || (buf[0] == 0xf0 && byte < 0x90)
- || (buf[0] == 0xf4 && byte > 0x8f)))
- goto invalid_seq;
- CONSUME_PEEKED_BYTE ();
- buf[1] = (scm_t_uint8) byte;
- *len = 2;
- byte = scm_peek_byte_or_eof_unlocked (port);
- ASSERT_NOT_EOF (byte);
- if (SCM_UNLIKELY ((byte & 0xc0) != 0x80))
- goto invalid_seq;
- CONSUME_PEEKED_BYTE ();
- buf[2] = (scm_t_uint8) byte;
- *len = 3;
- byte = scm_peek_byte_or_eof_unlocked (port);
- ASSERT_NOT_EOF (byte);
- if (SCM_UNLIKELY ((byte & 0xc0) != 0x80))
- goto invalid_seq;
- CONSUME_PEEKED_BYTE ();
- buf[3] = (scm_t_uint8) byte;
- *len = 4;
- *codepoint = ((scm_t_wchar) buf[0] & 0x07) << 18UL
- | ((scm_t_wchar) buf[1] & 0x3f) << 12UL
- | ((scm_t_wchar) buf[2] & 0x3f) << 6UL
- | (buf[3] & 0x3f);
- }
- else
- goto invalid_seq;
- return 0;
- invalid_seq:
- /* Here we could choose the consume the faulty byte when it's not a
- valid starting byte, but it's not a requirement. What Section 3.9
- of Unicode 6.0.0 mandates, though, is to not consume a byte that
- would otherwise be a valid starting byte. */
- return EILSEQ;
- #undef CONSUME_PEEKED_BYTE
- #undef ASSERT_NOT_EOF
- }
- /* Read an ISO-8859-1 codepoint (a byte) from PORT. On success, return
- 0 and set *CODEPOINT to the codepoint that was read, fill BUF with
- its UTF-8 representation, and set *LEN to the length in bytes.
- Return `EILSEQ' on error. */
- static int
- get_latin1_codepoint (SCM port, scm_t_wchar *codepoint,
- char buf[SCM_MBCHAR_BUF_SIZE], size_t *len)
- {
- *codepoint = scm_get_byte_or_eof_unlocked (port);
- if (*codepoint == EOF)
- *len = 0;
- else
- {
- *len = 1;
- buf[0] = *codepoint;
- }
- return 0;
- }
- /* Likewise, read a byte sequence from PORT, passing it through its
- input conversion descriptor. */
- static int
- get_iconv_codepoint (SCM port, scm_t_wchar *codepoint,
- char buf[SCM_MBCHAR_BUF_SIZE], size_t *len)
- {
- scm_t_iconv_descriptors *id;
- scm_t_uint8 utf8_buf[SCM_MBCHAR_BUF_SIZE];
- size_t input_size = 0;
- id = scm_i_port_iconv_descriptors (port, SCM_PORT_READ);
- for (;;)
- {
- int byte_read;
- char *input, *output;
- size_t input_left, output_left, done;
- byte_read = scm_get_byte_or_eof_unlocked (port);
- if (SCM_UNLIKELY (byte_read == EOF))
- {
- if (SCM_LIKELY (input_size == 0))
- {
- *codepoint = (scm_t_wchar) EOF;
- *len = input_size;
- return 0;
- }
- else
- {
- /* EOF found in the middle of a multibyte character. */
- scm_i_set_pending_eof (port);
- return EILSEQ;
- }
- }
- buf[input_size++] = byte_read;
- input = buf;
- input_left = input_size;
- output = (char *) utf8_buf;
- output_left = sizeof (utf8_buf);
- done = iconv (id->input_cd, &input, &input_left, &output, &output_left);
- if (done == (size_t) -1)
- {
- int err = errno;
- if (SCM_LIKELY (err == EINVAL))
- /* The input byte sequence did not form a complete
- character. Read another byte and try again. */
- continue;
- else
- return err;
- }
- else
- {
- size_t output_size = sizeof (utf8_buf) - output_left;
- if (SCM_LIKELY (output_size > 0))
- {
- /* iconv generated output. Convert the UTF8_BUF sequence
- to a Unicode code point. */
- *codepoint = utf8_to_codepoint (utf8_buf, output_size);
- *len = input_size;
- return 0;
- }
- else
- {
- /* iconv consumed some bytes without producing any output.
- Most likely this means that a Unicode byte-order mark
- (BOM) was consumed, which should not be included in the
- returned buf. Shift any remaining bytes to the beginning
- of buf, and continue the loop. */
- memmove (buf, input, input_left);
- input_size = input_left;
- continue;
- }
- }
- }
- }
- /* Read a codepoint from PORT and return it in *CODEPOINT. Fill BUF
- with the byte representation of the codepoint in PORT's encoding, and
- set *LEN to the length in bytes of that representation. Return 0 on
- success and an errno value on error. */
- static SCM_C_INLINE int
- get_codepoint (SCM port, scm_t_wchar *codepoint,
- char buf[SCM_MBCHAR_BUF_SIZE], size_t *len)
- {
- int err;
- scm_t_port *pt = SCM_PTAB_ENTRY (port);
- scm_t_port_internal *pti = SCM_PORT_GET_INTERNAL (port);
- if (pti->encoding_mode == SCM_PORT_ENCODING_MODE_UTF8)
- err = get_utf8_codepoint (port, codepoint, (scm_t_uint8 *) buf, len);
- else if (pti->encoding_mode == SCM_PORT_ENCODING_MODE_LATIN1)
- err = get_latin1_codepoint (port, codepoint, buf, len);
- else
- err = get_iconv_codepoint (port, codepoint, buf, len);
- if (SCM_LIKELY (err == 0))
- {
- if (SCM_UNLIKELY (pti->at_stream_start_for_bom_read))
- {
- /* Record that we're no longer at stream start. */
- pti->at_stream_start_for_bom_read = 0;
- if (pt->rw_random)
- pti->at_stream_start_for_bom_write = 0;
- /* If we just read a BOM in an encoding that recognizes them,
- then silently consume it and read another code point. */
- if (SCM_UNLIKELY
- (*codepoint == SCM_UNICODE_BOM
- && (pti->encoding_mode == SCM_PORT_ENCODING_MODE_UTF8
- || strcmp (pt->encoding, "UTF-16") == 0
- || strcmp (pt->encoding, "UTF-32") == 0)))
- return get_codepoint (port, codepoint, buf, len);
- }
- update_port_lf (*codepoint, port);
- }
- else if (pt->ilseq_handler == SCM_ICONVEH_QUESTION_MARK)
- {
- *codepoint = '?';
- err = 0;
- update_port_lf (*codepoint, port);
- }
- return err;
- }
- /* Read a codepoint from PORT and return it. */
- scm_t_wchar
- scm_getc_unlocked (SCM port)
- #define FUNC_NAME "scm_getc"
- {
- int err;
- size_t len;
- scm_t_wchar codepoint;
- char buf[SCM_MBCHAR_BUF_SIZE];
- err = get_codepoint (port, &codepoint, buf, &len);
- if (SCM_UNLIKELY (err != 0))
- /* At this point PORT should point past the invalid encoding, as per
- R6RS-lib Section 8.2.4. */
- scm_decoding_error (FUNC_NAME, err, "input decoding error", port);
- return codepoint;
- }
- #undef FUNC_NAME
- scm_t_wchar
- scm_getc (SCM port)
- {
- scm_i_pthread_mutex_t *lock;
- scm_t_wchar ret;
- scm_c_lock_port (port, &lock);
- ret = scm_getc_unlocked (port);
- if (lock)
- scm_i_pthread_mutex_unlock (lock);
-
- return ret;
- }
- SCM_DEFINE (scm_read_char, "read-char", 0, 1, 0,
- (SCM port),
- "Return the next character available from @var{port}, updating\n"
- "@var{port} to point to the following character. If no more\n"
- "characters are available, the end-of-file object is returned.\n"
- "\n"
- "When @var{port}'s data cannot be decoded according to its\n"
- "character encoding, a @code{decoding-error} is raised and\n"
- "@var{port} points past the erroneous byte sequence.\n")
- #define FUNC_NAME s_scm_read_char
- {
- scm_t_wchar c;
- if (SCM_UNBNDP (port))
- port = scm_current_input_port ();
- SCM_VALIDATE_OPINPORT (1, port);
- c = scm_getc_unlocked (port);
- if (EOF == c)
- return SCM_EOF_VAL;
- return SCM_MAKE_CHAR (c);
- }
- #undef FUNC_NAME
- /* Pushback. */
- static void
- scm_i_unget_bytes_unlocked (const unsigned char *buf, size_t len, SCM port)
- #define FUNC_NAME "scm_unget_bytes"
- {
- scm_t_port *pt = SCM_PTAB_ENTRY (port);
- size_t old_len, new_len;
- scm_i_clear_pending_eof (port);
- if (pt->read_buf != pt->putback_buf)
- /* switch to the put-back buffer. */
- {
- if (pt->putback_buf == NULL)
- {
- pt->putback_buf_size = (len > SCM_INITIAL_PUTBACK_BUF_SIZE
- ? len : SCM_INITIAL_PUTBACK_BUF_SIZE);
- pt->putback_buf
- = (unsigned char *) scm_gc_malloc_pointerless
- (pt->putback_buf_size, "putback buffer");
- }
- pt->saved_read_buf = pt->read_buf;
- pt->saved_read_pos = pt->read_pos;
- pt->saved_read_end = pt->read_end;
- pt->saved_read_buf_size = pt->read_buf_size;
- /* Put read_pos at the end of the buffer, so that ungets will not
- have to shift the buffer contents each time. */
- pt->read_buf = pt->putback_buf;
- pt->read_pos = pt->read_end = pt->putback_buf + pt->putback_buf_size;
- pt->read_buf_size = pt->putback_buf_size;
- }
- old_len = pt->read_end - pt->read_pos;
- new_len = old_len + len;
- if (new_len > pt->read_buf_size)
- /* The putback buffer needs to be enlarged. */
- {
- size_t new_buf_size;
- unsigned char *new_buf, *new_end, *new_pos;
- new_buf_size = pt->read_buf_size * 2;
- if (new_buf_size < new_len)
- new_buf_size = new_len;
- new_buf = (unsigned char *)
- scm_gc_malloc_pointerless (new_buf_size, "putback buffer");
- /* Put the bytes at the end of the buffer, so that future
- ungets won't need to shift the buffer. */
- new_end = new_buf + new_buf_size;
- new_pos = new_end - old_len;
- memcpy (new_pos, pt->read_pos, old_len);
- pt->read_buf = pt->putback_buf = new_buf;
- pt->read_pos = new_pos;
- pt->read_end = new_end;
- pt->read_buf_size = pt->putback_buf_size = new_buf_size;
- }
- else if (pt->read_buf + len < pt->read_pos)
- /* If needed, shift the existing buffer contents up.
- This should not happen unless some external code
- manipulates the putback buffer pointers. */
- {
- unsigned char *new_end = pt->read_buf + pt->read_buf_size;
- unsigned char *new_pos = new_end - old_len;
- memmove (new_pos, pt->read_pos, old_len);
- pt->read_pos = new_pos;
- pt->read_end = new_end;
- }
- /* Move read_pos back and copy the bytes there. */
- pt->read_pos -= len;
- memcpy (pt->read_buf + (pt->read_pos - pt->read_buf), buf, len);
- if (pt->rw_active == SCM_PORT_WRITE)
- scm_flush (port);
- if (pt->rw_random)
- pt->rw_active = SCM_PORT_READ;
- }
- #undef FUNC_NAME
- void
- scm_unget_bytes_unlocked (const unsigned char *buf, size_t len, SCM port)
- {
- scm_i_unget_bytes_unlocked (buf, len, port);
- }
- void
- scm_unget_byte_unlocked (int c, SCM port)
- {
- unsigned char byte = c;
- scm_i_unget_bytes_unlocked (&byte, 1, port);
- }
- void
- scm_unget_bytes (const unsigned char *buf, size_t len, SCM port)
- {
- scm_i_pthread_mutex_t *lock;
- scm_c_lock_port (port, &lock);
- scm_i_unget_bytes_unlocked (buf, len, port);
- if (lock)
- scm_i_pthread_mutex_unlock (lock);
- }
- void
- scm_unget_byte (int c, SCM port)
- {
- unsigned char byte = c;
- scm_i_pthread_mutex_t *lock;
- scm_c_lock_port (port, &lock);
- scm_i_unget_bytes_unlocked (&byte, 1, port);
- if (lock)
- scm_i_pthread_mutex_unlock (lock);
- }
- void
- scm_ungetc_unlocked (scm_t_wchar c, SCM port)
- #define FUNC_NAME "scm_ungetc"
- {
- scm_t_port *pt = SCM_PTAB_ENTRY (port);
- scm_t_port_internal *pti = SCM_PORT_GET_INTERNAL (port);
- char *result;
- char result_buf[10];
- size_t len;
- len = sizeof (result_buf);
- if (pti->encoding_mode == SCM_PORT_ENCODING_MODE_UTF8)
- {
- if (c < 0x80)
- {
- result_buf[0] = (char) c;
- result = result_buf;
- len = 1;
- }
- else
- result =
- (char *) u32_to_u8 ((uint32_t *) &c, 1, (uint8_t *) result_buf, &len);
- }
- else if (pti->encoding_mode == SCM_PORT_ENCODING_MODE_LATIN1 && c <= 0xff)
- {
- result_buf[0] = (char) c;
- result = result_buf;
- len = 1;
- }
- else
- result = u32_conv_to_encoding (pt->encoding,
- (enum iconv_ilseq_handler) pt->ilseq_handler,
- (uint32_t *) &c, 1, NULL,
- result_buf, &len);
- if (SCM_UNLIKELY (result == NULL || len == 0))
- scm_encoding_error (FUNC_NAME, errno,
- "conversion to port encoding failed",
- SCM_BOOL_F, SCM_MAKE_CHAR (c));
- scm_i_unget_bytes_unlocked ((unsigned char *) result, len, port);
- if (SCM_UNLIKELY (result != result_buf))
- free (result);
- if (c == '\n')
- SCM_LINUM (port) -= 1;
- SCM_DECCOL (port);
- }
- #undef FUNC_NAME
- void
- scm_ungetc (scm_t_wchar c, SCM port)
- {
- scm_i_pthread_mutex_t *lock;
- scm_c_lock_port (port, &lock);
- scm_ungetc_unlocked (c, port);
- if (lock)
- scm_i_pthread_mutex_unlock (lock);
-
- }
- void
- scm_ungets_unlocked (const char *s, int n, SCM port)
- {
- /* This is simple minded and inefficient, but unreading strings is
- * probably not a common operation, and remember that line and
- * column numbers have to be handled...
- *
- * Please feel free to write an optimized version!
- */
- while (n--)
- scm_ungetc_unlocked (s[n], port);
- }
- void
- scm_ungets (const char *s, int n, SCM port)
- {
- scm_i_pthread_mutex_t *lock;
- scm_c_lock_port (port, &lock);
- scm_ungets_unlocked (s, n, port);
- if (lock)
- scm_i_pthread_mutex_unlock (lock);
-
- }
- SCM_DEFINE (scm_peek_char, "peek-char", 0, 1, 0,
- (SCM port),
- "Return the next character available from @var{port},\n"
- "@emph{without} updating @var{port} to point to the following\n"
- "character. If no more characters are available, the\n"
- "end-of-file object is returned.\n"
- "\n"
- "The value returned by\n"
- "a call to @code{peek-char} is the same as the value that would\n"
- "have been returned by a call to @code{read-char} on the same\n"
- "port. The only difference is that the very next call to\n"
- "@code{read-char} or @code{peek-char} on that @var{port} will\n"
- "return the value returned by the preceding call to\n"
- "@code{peek-char}. In particular, a call to @code{peek-char} on\n"
- "an interactive port will hang waiting for input whenever a call\n"
- "to @code{read-char} would have hung.\n"
- "\n"
- "As for @code{read-char}, a @code{decoding-error} may be raised\n"
- "if such a situation occurs. However, unlike with @code{read-char},\n"
- "@var{port} still points at the beginning of the erroneous byte\n"
- "sequence when the error is raised.\n")
- #define FUNC_NAME s_scm_peek_char
- {
- int err;
- SCM result;
- scm_t_wchar c;
- char bytes[SCM_MBCHAR_BUF_SIZE];
- long column, line;
- size_t len = 0;
- if (SCM_UNBNDP (port))
- port = scm_current_input_port ();
- SCM_VALIDATE_OPINPORT (1, port);
- column = SCM_COL (port);
- line = SCM_LINUM (port);
- err = get_codepoint (port, &c, bytes, &len);
- scm_i_unget_bytes_unlocked ((unsigned char *) bytes, len, port);
- SCM_COL (port) = column;
- SCM_LINUM (port) = line;
- if (SCM_UNLIKELY (err != 0))
- {
- scm_decoding_error (FUNC_NAME, err, "input decoding error", port);
- /* Shouldn't happen since `catch' always aborts to prompt. */
- result = SCM_BOOL_F;
- }
- else if (c == EOF)
- {
- scm_i_set_pending_eof (port);
- result = SCM_EOF_VAL;
- }
- else
- result = SCM_MAKE_CHAR (c);
- return result;
- }
- #undef FUNC_NAME
- SCM_DEFINE (scm_unread_char, "unread-char", 1, 1, 0,
- (SCM cobj, SCM port),
- "Place character @var{cobj} in @var{port} so that it will be\n"
- "read by the next read operation. If called multiple times, the\n"
- "unread characters will be read again in last-in first-out\n"
- "order. If @var{port} is not supplied, the current input port\n"
- "is used.")
- #define FUNC_NAME s_scm_unread_char
- {
- int c;
- SCM_VALIDATE_CHAR (1, cobj);
- if (SCM_UNBNDP (port))
- port = scm_current_input_port ();
- SCM_VALIDATE_OPINPORT (2, port);
- c = SCM_CHAR (cobj);
- scm_ungetc_unlocked (c, port);
- return cobj;
- }
- #undef FUNC_NAME
- SCM_DEFINE (scm_unread_string, "unread-string", 2, 0, 0,
- (SCM str, SCM port),
- "Place the string @var{str} in @var{port} so that its characters will be\n"
- "read in subsequent read operations. If called multiple times, the\n"
- "unread characters will be read again in last-in first-out order. If\n"
- "@var{port} is not supplied, the current-input-port is used.")
- #define FUNC_NAME s_scm_unread_string
- {
- int n;
- SCM_VALIDATE_STRING (1, str);
- if (SCM_UNBNDP (port))
- port = scm_current_input_port ();
- SCM_VALIDATE_OPINPORT (2, port);
- n = scm_i_string_length (str);
- while (n--)
- scm_ungetc_unlocked (scm_i_string_ref (str, n), port);
-
- return str;
- }
- #undef FUNC_NAME
- /* Manipulating the buffers. */
- /* This routine does not take any locks, as it is usually called as part
- of a port implementation. */
- void
- scm_port_non_buffer (scm_t_port *pt)
- {
- pt->read_pos = pt->read_buf = pt->read_end = &pt->shortbuf;
- pt->write_buf = pt->write_pos = &pt->shortbuf;
- pt->read_buf_size = pt->write_buf_size = 1;
- pt->write_end = pt->write_buf + pt->write_buf_size;
- }
- /* this should only be called when the read buffer is empty. it
- tries to refill the read buffer. it returns the first char from
- the port, which is either EOF or *(pt->read_pos). */
- static int
- scm_i_fill_input_unlocked (SCM port)
- {
- scm_t_port *pt = SCM_PTAB_ENTRY (port);
- scm_t_port_internal *pti = SCM_PORT_GET_INTERNAL (port);
- assert (pt->read_pos == pt->read_end);
- if (pti->pending_eof)
- {
- pti->pending_eof = 0;
- return EOF;
- }
- if (pt->read_buf == pt->putback_buf)
- {
- /* finished reading put-back chars. */
- pt->read_buf = pt->saved_read_buf;
- pt->read_pos = pt->saved_read_pos;
- pt->read_end = pt->saved_read_end;
- pt->read_buf_size = pt->saved_read_buf_size;
- if (pt->read_pos < pt->read_end)
- return *(pt->read_pos);
- }
- return SCM_PORT_DESCRIPTOR (port)->fill_input (port);
- }
- int
- scm_fill_input (SCM port)
- {
- scm_i_pthread_mutex_t *lock;
- int ret;
-
- scm_c_lock_port (port, &lock);
- ret = scm_fill_input_unlocked (port);
- if (lock)
- scm_i_pthread_mutex_unlock (lock);
-
- return ret;
- }
- /* Slow-path fallback for 'scm_get_byte_or_eof_unlocked' */
- int
- scm_slow_get_byte_or_eof_unlocked (SCM port)
- {
- scm_t_port *pt = SCM_PTAB_ENTRY (port);
- if (pt->rw_active == SCM_PORT_WRITE)
- scm_flush_unlocked (port);
- if (pt->rw_random)
- pt->rw_active = SCM_PORT_READ;
- if (pt->read_pos >= pt->read_end)
- {
- if (SCM_UNLIKELY (scm_i_fill_input_unlocked (port) == EOF))
- return EOF;
- }
- return *pt->read_pos++;
- }
- /* Slow-path fallback for 'scm_peek_byte_or_eof_unlocked' */
- int
- scm_slow_peek_byte_or_eof_unlocked (SCM port)
- {
- scm_t_port *pt = SCM_PTAB_ENTRY (port);
- if (pt->rw_active == SCM_PORT_WRITE)
- scm_flush_unlocked (port);
- if (pt->rw_random)
- pt->rw_active = SCM_PORT_READ;
- if (pt->read_pos >= pt->read_end)
- {
- if (SCM_UNLIKELY (scm_i_fill_input_unlocked (port) == EOF))
- {
- scm_i_set_pending_eof (port);
- return EOF;
- }
- }
- return *pt->read_pos;
- }
- /* Move up to READ_LEN bytes from PORT's putback and/or read buffers
- into memory starting at DEST. Return the number of bytes moved.
- PORT's line/column numbers are left unchanged. */
- size_t
- scm_take_from_input_buffers (SCM port, char *dest, size_t read_len)
- {
- scm_t_port *pt = SCM_PTAB_ENTRY (port);
- size_t bytes_read = 0;
- size_t from_buf = min (pt->read_end - pt->read_pos, read_len);
- if (from_buf > 0)
- {
- memcpy (dest, pt->read_pos, from_buf);
- pt->read_pos += from_buf;
- bytes_read += from_buf;
- read_len -= from_buf;
- dest += from_buf;
- }
- /* if putback was active, try the real input buffer too. */
- if (pt->read_buf == pt->putback_buf)
- {
- from_buf = min (pt->saved_read_end - pt->saved_read_pos, read_len);
- if (from_buf > 0)
- {
- memcpy (dest, pt->saved_read_pos, from_buf);
- pt->saved_read_pos += from_buf;
- bytes_read += from_buf;
- }
- }
- return bytes_read;
- }
- /* Clear a port's read buffers, returning the contents. */
- SCM_DEFINE (scm_drain_input, "drain-input", 1, 0, 0,
- (SCM port),
- "This procedure clears a port's input buffers, similar\n"
- "to the way that force-output clears the output buffer. The\n"
- "contents of the buffers are returned as a single string, e.g.,\n"
- "\n"
- "@lisp\n"
- "(define p (open-input-file ...))\n"
- "(drain-input p) => empty string, nothing buffered yet.\n"
- "(unread-char (read-char p) p)\n"
- "(drain-input p) => initial chars from p, up to the buffer size.\n"
- "@end lisp\n\n"
- "Draining the buffers may be useful for cleanly finishing\n"
- "buffered I/O so that the file descriptor can be used directly\n"
- "for further input.")
- #define FUNC_NAME s_scm_drain_input
- {
- SCM result;
- char *data;
- scm_t_port *pt;
- long count;
- SCM_VALIDATE_OPINPORT (1, port);
- pt = SCM_PTAB_ENTRY (port);
- count = pt->read_end - pt->read_pos;
- if (pt->read_buf == pt->putback_buf)
- count += pt->saved_read_end - pt->saved_read_pos;
- if (count)
- {
- result = scm_i_make_string (count, &data, 0);
- scm_take_from_input_buffers (port, data, count);
- }
- else
- result = scm_nullstr;
-
- return result;
- }
- #undef FUNC_NAME
- void
- scm_end_input_unlocked (SCM port)
- {
- long offset;
- scm_t_port *pt = SCM_PTAB_ENTRY (port);
- scm_i_clear_pending_eof (port);
- if (pt->read_buf == pt->putback_buf)
- {
- offset = pt->read_end - pt->read_pos;
- pt->read_buf = pt->saved_read_buf;
- pt->read_pos = pt->saved_read_pos;
- pt->read_end = pt->saved_read_end;
- pt->read_buf_size = pt->saved_read_buf_size;
- }
- else
- offset = 0;
- SCM_PORT_DESCRIPTOR (port)->end_input (port, offset);
- }
- void
- scm_end_input (SCM port)
- {
- scm_i_pthread_mutex_t *lock;
- scm_c_lock_port (port, &lock);
- scm_end_input_unlocked (port);
- if (lock)
- scm_i_pthread_mutex_unlock (lock);
-
- }
- SCM_DEFINE (scm_force_output, "force-output", 0, 1, 0,
- (SCM port),
- "Flush the specified output port, or the current output port if @var{port}\n"
- "is omitted. The current output buffer contents are passed to the\n"
- "underlying port implementation (e.g., in the case of fports, the\n"
- "data will be written to the file and the output buffer will be cleared.)\n"
- "It has no effect on an unbuffered port.\n\n"
- "The return value is unspecified.")
- #define FUNC_NAME s_scm_force_output
- {
- if (SCM_UNBNDP (port))
- port = scm_current_output_port ();
- else
- {
- port = SCM_COERCE_OUTPORT (port);
- SCM_VALIDATE_OPOUTPORT (1, port);
- }
- scm_flush_unlocked (port);
- return SCM_UNSPECIFIED;
- }
- #undef FUNC_NAME
- void
- scm_flush_unlocked (SCM port)
- {
- SCM_PORT_DESCRIPTOR (port)->flush (port);
- }
- void
- scm_flush (SCM port)
- {
- scm_i_pthread_mutex_t *lock;
- scm_c_lock_port (port, &lock);
- scm_flush_unlocked (port);
- if (lock)
- scm_i_pthread_mutex_unlock (lock);
-
- }
- int
- scm_fill_input_unlocked (SCM port)
- {
- return scm_i_fill_input_unlocked (port);
- }
- /* Output. */
- void
- scm_putc (char c, SCM port)
- {
- scm_i_pthread_mutex_t *lock;
- scm_c_lock_port (port, &lock);
- scm_putc_unlocked (c, port);
- if (lock)
- scm_i_pthread_mutex_unlock (lock);
-
- }
- void
- scm_puts (const char *s, SCM port)
- {
- scm_i_pthread_mutex_t *lock;
- scm_c_lock_port (port, &lock);
- scm_puts_unlocked (s, port);
- if (lock)
- scm_i_pthread_mutex_unlock (lock);
-
- }
-
- /* scm_c_write
- *
- * Used by an application to write arbitrary number of bytes to an SCM
- * port. Similar semantics as libc write. However, unlike libc
- * write, scm_c_write writes the requested number of bytes and has no
- * return value.
- *
- * Warning: Doesn't update port line and column counts!
- */
- void
- scm_c_write_unlocked (SCM port, const void *ptr, size_t size)
- #define FUNC_NAME "scm_c_write"
- {
- scm_t_port *pt;
- scm_t_ptob_descriptor *ptob;
- SCM_VALIDATE_OPOUTPORT (1, port);
- pt = SCM_PTAB_ENTRY (port);
- ptob = SCM_PORT_DESCRIPTOR (port);
- if (pt->rw_active == SCM_PORT_READ)
- scm_end_input_unlocked (port);
- ptob->write (port, ptr, size);
- if (pt->rw_random)
- pt->rw_active = SCM_PORT_WRITE;
- }
- #undef FUNC_NAME
- void
- scm_c_write (SCM port, const void *ptr, size_t size)
- {
- scm_i_pthread_mutex_t *lock;
- scm_c_lock_port (port, &lock);
- scm_c_write_unlocked (port, ptr, size);
- if (lock)
- scm_i_pthread_mutex_unlock (lock);
-
- }
- /* scm_lfwrite
- *
- * This function differs from scm_c_write; it updates port line and
- * column. */
- void
- scm_lfwrite_unlocked (const char *ptr, size_t size, SCM port)
- {
- scm_t_port *pt = SCM_PTAB_ENTRY (port);
- scm_t_ptob_descriptor *ptob = SCM_PORT_DESCRIPTOR (port);
- if (pt->rw_active == SCM_PORT_READ)
- scm_end_input_unlocked (port);
- ptob->write (port, ptr, size);
- for (; size; ptr++, size--)
- update_port_lf ((scm_t_wchar) (unsigned char) *ptr, port);
- if (pt->rw_random)
- pt->rw_active = SCM_PORT_WRITE;
- }
- void
- scm_lfwrite (const char *ptr, size_t size, SCM port)
- {
- scm_i_pthread_mutex_t *lock;
- scm_c_lock_port (port, &lock);
- scm_lfwrite_unlocked (ptr, size, port);
- if (lock)
- scm_i_pthread_mutex_unlock (lock);
-
- }
- /* Write STR to PORT from START inclusive to END exclusive. */
- void
- scm_lfwrite_substr (SCM str, size_t start, size_t end, SCM port)
- {
- scm_t_port *pt = SCM_PTAB_ENTRY (port);
- if (pt->rw_active == SCM_PORT_READ)
- scm_end_input_unlocked (port);
- if (end == (size_t) -1)
- end = scm_i_string_length (str);
- scm_i_display_substring (str, start, end, port);
- if (pt->rw_random)
- pt->rw_active = SCM_PORT_WRITE;
- }
- /* Querying and setting positions, and character availability. */
- SCM_DEFINE (scm_char_ready_p, "char-ready?", 0, 1, 0,
- (SCM port),
- "Return @code{#t} if a character is ready on input @var{port}\n"
- "and return @code{#f} otherwise. If @code{char-ready?} returns\n"
- "@code{#t} then the next @code{read-char} operation on\n"
- "@var{port} is guaranteed not to hang. If @var{port} is a file\n"
- "port at end of file then @code{char-ready?} returns @code{#t}.\n"
- "\n"
- "@code{char-ready?} exists to make it possible for a\n"
- "program to accept characters from interactive ports without\n"
- "getting stuck waiting for input. Any input editors associated\n"
- "with such ports must make sure that characters whose existence\n"
- "has been asserted by @code{char-ready?} cannot be rubbed out.\n"
- "If @code{char-ready?} were to return @code{#f} at end of file,\n"
- "a port at end of file would be indistinguishable from an\n"
- "interactive port that has no ready characters.")
- #define FUNC_NAME s_scm_char_ready_p
- {
- scm_t_port *pt;
- if (SCM_UNBNDP (port))
- port = scm_current_input_port ();
- /* It's possible to close the current input port, so validate even in
- this case. */
- SCM_VALIDATE_OPINPORT (1, port);
- pt = SCM_PTAB_ENTRY (port);
- /* if the current read buffer is filled, or the
- last pushed-back char has been read and the saved buffer is
- filled, result is true. */
- if (pt->read_pos < pt->read_end
- || (pt->read_buf == pt->putback_buf
- && pt->saved_read_pos < pt->saved_read_end))
- return SCM_BOOL_T;
- else
- {
- scm_t_ptob_descriptor *ptob = SCM_PORT_DESCRIPTOR (port);
-
- if (ptob->input_waiting)
- return scm_from_bool(ptob->input_waiting (port));
- else
- return SCM_BOOL_T;
- }
- }
- #undef FUNC_NAME
- SCM_DEFINE (scm_seek, "seek", 3, 0, 0,
- (SCM fd_port, SCM offset, SCM whence),
- "Sets the current position of @var{fd_port} to the integer\n"
- "@var{offset}, which is interpreted according to the value of\n"
- "@var{whence}.\n"
- "\n"
- "One of the following variables should be supplied for\n"
- "@var{whence}:\n"
- "@defvar SEEK_SET\n"
- "Seek from the beginning of the file.\n"
- "@end defvar\n"
- "@defvar SEEK_CUR\n"
- "Seek from the current position.\n"
- "@end defvar\n"
- "@defvar SEEK_END\n"
- "Seek from the end of the file.\n"
- "@end defvar\n"
- "If @var{fd_port} is a file descriptor, the underlying system\n"
- "call is @code{lseek}. @var{port} may be a string port.\n"
- "\n"
- "The value returned is the new position in the file. This means\n"
- "that the current position of a port can be obtained using:\n"
- "@lisp\n"
- "(seek port 0 SEEK_CUR)\n"
- "@end lisp")
- #define FUNC_NAME s_scm_seek
- {
- int how;
- fd_port = SCM_COERCE_OUTPORT (fd_port);
- how = scm_to_int (whence);
- if (how != SEEK_SET && how != SEEK_CUR && how != SEEK_END)
- SCM_OUT_OF_RANGE (3, whence);
- if (SCM_OPPORTP (fd_port))
- {
- scm_t_port_internal *pti = SCM_PORT_GET_INTERNAL (fd_port);
- scm_t_ptob_descriptor *ptob = SCM_PORT_DESCRIPTOR (fd_port);
- off_t_or_off64_t off = scm_to_off_t_or_off64_t (offset);
- off_t_or_off64_t rv;
- if (!ptob->seek)
- SCM_MISC_ERROR ("port is not seekable",
- scm_cons (fd_port, SCM_EOL));
- else
- rv = ptob->seek (fd_port, off, how);
- /* Set stream-start flags according to new position. */
- pti->at_stream_start_for_bom_read = (rv == 0);
- pti->at_stream_start_for_bom_write = (rv == 0);
- scm_i_clear_pending_eof (fd_port);
- return scm_from_off_t_or_off64_t (rv);
- }
- else /* file descriptor?. */
- {
- off_t_or_off64_t off = scm_to_off_t_or_off64_t (offset);
- off_t_or_off64_t rv;
- rv = lseek_or_lseek64 (scm_to_int (fd_port), off, how);
- if (rv == -1)
- SCM_SYSERROR;
- return scm_from_off_t_or_off64_t (rv);
- }
- }
- #undef FUNC_NAME
/* O_BINARY is given a no-op value when the platform headers do not
   define it.  */
#ifndef O_BINARY
#define O_BINARY 0
#endif

/* Mingw has ftruncate(), perhaps implemented above using chsize, but
   doesn't have the filename version truncate(), hence this code.  */
#if HAVE_FTRUNCATE && ! HAVE_TRUNCATE
/* Truncate the file named FILE to LENGTH bytes by opening it
   write-only and calling ftruncate on the descriptor.  Returns -1 when
   opening or truncating fails, preserving ftruncate's errno across
   the close; otherwise returns the result of close.  */
static int
truncate (const char *file, off_t length)
{
  int fd, status;

  fd = open (file, O_BINARY | O_WRONLY);
  if (fd == -1)
    return -1;

  status = ftruncate (fd, length);
  if (status != -1)
    return close (fd);

  {
    /* close may overwrite errno; keep the one from ftruncate.  */
    int saved_errno = errno;

    close (fd);
    errno = saved_errno;
  }
  return -1;
}
#endif /* HAVE_FTRUNCATE && ! HAVE_TRUNCATE */
- SCM_DEFINE (scm_truncate_file, "truncate-file", 1, 1, 0,
- (SCM object, SCM length),
- "Truncate file @var{object} to @var{length} bytes. @var{object}\n"
- "can be a filename string, a port object, or an integer file\n"
- "descriptor.\n"
- "The return value is unspecified.\n"
- "\n"
- "For a port or file descriptor @var{length} can be omitted, in\n"
- "which case the file is truncated at the current position (per\n"
- "@code{ftell} above).\n"
- "\n"
- "On most systems a file can be extended by giving a length\n"
- "greater than the current size, but this is not mandatory in the\n"
- "POSIX standard.")
- #define FUNC_NAME s_scm_truncate_file
- {
- int rv;
- /* "object" can be a port, fdes or filename.
- Negative "length" makes no sense, but it's left to truncate() or
- ftruncate() to give back an error for that (normally EINVAL).
- */
- if (SCM_UNBNDP (length))
- {
- /* must supply length if object is a filename. */
- if (scm_is_string (object))
- SCM_MISC_ERROR("must supply length if OBJECT is a filename", SCM_EOL);
-
- length = scm_seek (object, SCM_INUM0, scm_from_int (SEEK_CUR));
- }
- object = SCM_COERCE_OUTPORT (object);
- if (scm_is_integer (object))
- {
- off_t_or_off64_t c_length = scm_to_off_t_or_off64_t (length);
- SCM_SYSCALL (rv = ftruncate_or_ftruncate64 (scm_to_int (object),
- c_length));
- }
- else if (SCM_OPOUTPORTP (object))
- {
- off_t_or_off64_t c_length = scm_to_off_t_or_off64_t (length);
- scm_t_port *pt = SCM_PTAB_ENTRY (object);
- scm_t_ptob_descriptor *ptob = SCM_PORT_DESCRIPTOR (object);
- if (!ptob->truncate)
- SCM_MISC_ERROR ("port is not truncatable", SCM_EOL);
- scm_i_clear_pending_eof (object);
- if (pt->rw_active == SCM_PORT_READ)
- scm_end_input_unlocked (object);
- else if (pt->rw_active == SCM_PORT_WRITE)
- ptob->flush (object);
- ptob->truncate (object, c_length);
- rv = 0;
- }
- else
- {
- off_t_or_off64_t c_length = scm_to_off_t_or_off64_t (length);
- char *str = scm_to_locale_string (object);
- int eno;
- SCM_SYSCALL (rv = truncate_or_truncate64 (str, c_length));
- eno = errno;
- free (str);
- errno = eno;
- }
- if (rv == -1)
- SCM_SYSERROR;
- return SCM_UNSPECIFIED;
- }
- #undef FUNC_NAME
- SCM_DEFINE (scm_port_line, "port-line", 1, 0, 0,
- (SCM port),
- "Return the current line number for @var{port}.\n"
- "\n"
- "The first line of a file is 0. But you might want to add 1\n"
- "when printing line numbers, since starting from 1 is\n"
- "traditional in error messages, and likely to be more natural to\n"
- "non-programmers.")
- #define FUNC_NAME s_scm_port_line
- {
- port = SCM_COERCE_OUTPORT (port);
- SCM_VALIDATE_OPENPORT (1, port);
- return scm_from_long (SCM_LINUM (port));
- }
- #undef FUNC_NAME
- SCM_DEFINE (scm_set_port_line_x, "set-port-line!", 2, 0, 0,
- (SCM port, SCM line),
- "Set the current line number for @var{port} to @var{line}. The\n"
- "first line of a file is 0.")
- #define FUNC_NAME s_scm_set_port_line_x
- {
- port = SCM_COERCE_OUTPORT (port);
- SCM_VALIDATE_OPENPORT (1, port);
- SCM_PTAB_ENTRY (port)->line_number = scm_to_long (line);
- return SCM_UNSPECIFIED;
- }
- #undef FUNC_NAME
- SCM_DEFINE (scm_port_column, "port-column", 1, 0, 0,
- (SCM port),
- "Return the current column number of @var{port}.\n"
- "If the number is\n"
- "unknown, the result is #f. Otherwise, the result is a 0-origin integer\n"
- "- i.e. the first character of the first line is line 0, column 0.\n"
- "(However, when you display a file position, for example in an error\n"
- "message, we recommend you add 1 to get 1-origin integers. This is\n"
- "because lines and column numbers traditionally start with 1, and that is\n"
- "what non-programmers will find most natural.)")
- #define FUNC_NAME s_scm_port_column
- {
- port = SCM_COERCE_OUTPORT (port);
- SCM_VALIDATE_OPENPORT (1, port);
- return scm_from_int (SCM_COL (port));
- }
- #undef FUNC_NAME
- SCM_DEFINE (scm_set_port_column_x, "set-port-column!", 2, 0, 0,
- (SCM port, SCM column),
- "Set the current column of @var{port}. Before reading the first\n"
- "character on a line the column should be 0.")
- #define FUNC_NAME s_scm_set_port_column_x
- {
- port = SCM_COERCE_OUTPORT (port);
- SCM_VALIDATE_OPENPORT (1, port);
- SCM_PTAB_ENTRY (port)->column_number = scm_to_int (column);
- return SCM_UNSPECIFIED;
- }
- #undef FUNC_NAME
- SCM_DEFINE (scm_port_filename, "port-filename", 1, 0, 0,
- (SCM port),
- "Return the filename associated with @var{port}, or @code{#f}\n"
- "if no filename is associated with the port.")
- #define FUNC_NAME s_scm_port_filename
- {
- port = SCM_COERCE_OUTPORT (port);
- SCM_VALIDATE_OPENPORT (1, port);
- return SCM_FILENAME (port);
- }
- #undef FUNC_NAME
- SCM_DEFINE (scm_set_port_filename_x, "set-port-filename!", 2, 0, 0,
- (SCM port, SCM filename),
- "Change the filename associated with @var{port}, using the current input\n"
- "port if none is specified. Note that this does not change the port's\n"
- "source of data, but only the value that is returned by\n"
- "@code{port-filename} and reported in diagnostic output.")
- #define FUNC_NAME s_scm_set_port_filename_x
- {
- port = SCM_COERCE_OUTPORT (port);
- SCM_VALIDATE_OPENPORT (1, port);
- /* We allow the user to set the filename to whatever he likes. */
- SCM_SET_FILENAME (port, filename);
- return SCM_UNSPECIFIED;
- }
- #undef FUNC_NAME
- /* Implementation helpers for port printing functions. */
- void
- scm_print_port_mode (SCM exp, SCM port)
- {
- scm_puts_unlocked (SCM_CLOSEDP (exp)
- ? "closed: "
- : (SCM_RDNG & SCM_CELL_WORD_0 (exp)
- ? (SCM_WRTNG & SCM_CELL_WORD_0 (exp)
- ? "input-output: "
- : "input: ")
- : (SCM_WRTNG & SCM_CELL_WORD_0 (exp)
- ? "output: "
- : "bogus: ")),
- port);
- }
- int
- scm_port_print (SCM exp, SCM port, scm_print_state *pstate SCM_UNUSED)
- {
- char *type = SCM_PTOBNAME (SCM_PTOBNUM (exp));
- if (!type)
- type = "port";
- scm_puts_unlocked ("#<", port);
- scm_print_port_mode (exp, port);
- scm_puts_unlocked (type, port);
- scm_putc_unlocked (' ', port);
- scm_uintprint (SCM_CELL_WORD_1 (exp), 16, port);
- scm_putc_unlocked ('>', port);
- return 1;
- }
- /* Iterating over all ports. */
- struct for_each_data
- {
- void (*proc) (void *data, SCM p);
- void *data;
- };
- static SCM
- for_each_trampoline (void *data, SCM port, SCM result)
- {
- struct for_each_data *d = data;
-
- d->proc (d->data, port);
- return result;
- }
- void
- scm_c_port_for_each (void (*proc)(void *data, SCM p), void *data)
- {
- struct for_each_data d;
-
- d.proc = proc;
- d.data = data;
- scm_c_weak_set_fold (for_each_trampoline, &d, SCM_EOL,
- scm_i_port_weak_set);
- }
- static void
- scm_for_each_trampoline (void *data, SCM port)
- {
- scm_call_1 (SCM_PACK_POINTER (data), port);
- }
- SCM_DEFINE (scm_port_for_each, "port-for-each", 1, 0, 0,
- (SCM proc),
- "Apply @var{proc} to each port in the Guile port table\n"
- "in turn. The return value is unspecified. More specifically,\n"
- "@var{proc} is applied exactly once to every port that exists\n"
- "in the system at the time @code{port-for-each} is invoked.\n"
- "Changes to the port table while @code{port-for-each} is running\n"
- "have no effect as far as @code{port-for-each} is concerned.")
- #define FUNC_NAME s_scm_port_for_each
- {
- SCM_VALIDATE_PROC (1, proc);
- scm_c_port_for_each (scm_for_each_trampoline, SCM_UNPACK_POINTER (proc));
-
- return SCM_UNSPECIFIED;
- }
- #undef FUNC_NAME
- static void
- flush_output_port (void *closure, SCM port)
- {
- if (SCM_OPOUTPORTP (port))
- scm_flush_unlocked (port);
- }
- SCM_DEFINE (scm_flush_all_ports, "flush-all-ports", 0, 0, 0,
- (),
- "Equivalent to calling @code{force-output} on\n"
- "all open output ports. The return value is unspecified.")
- #define FUNC_NAME s_scm_flush_all_ports
- {
- scm_c_port_for_each (&flush_output_port, NULL);
- return SCM_UNSPECIFIED;
- }
- #undef FUNC_NAME
- /* Void ports. */
- scm_t_bits scm_tc16_void_port = 0;
- static int fill_input_void_port (SCM port SCM_UNUSED)
- {
- return EOF;
- }
- static void
- write_void_port (SCM port SCM_UNUSED,
- const void *data SCM_UNUSED,
- size_t size SCM_UNUSED)
- {
- }
- static SCM
- scm_i_void_port (long mode_bits)
- {
- SCM ret;
- ret = scm_c_make_port (scm_tc16_void_port, mode_bits, 0);
- scm_port_non_buffer (SCM_PTAB_ENTRY (ret));
-
- return ret;
- }
- SCM
- scm_void_port (char *mode_str)
- {
- return scm_i_void_port (scm_mode_bits (mode_str));
- }
- SCM_DEFINE (scm_sys_make_void_port, "%make-void-port", 1, 0, 0,
- (SCM mode),
- "Create and return a new void port. A void port acts like\n"
- "@file{/dev/null}. The @var{mode} argument\n"
- "specifies the input/output modes for this port: see the\n"
- "documentation for @code{open-file} in @ref{File Ports}.")
- #define FUNC_NAME s_scm_sys_make_void_port
- {
- return scm_i_void_port (scm_i_mode_bits (mode));
- }
- #undef FUNC_NAME
- /* Initialization. */
- void
- scm_init_ports ()
- {
- /* lseek() symbols. */
- scm_c_define ("SEEK_SET", scm_from_int (SEEK_SET));
- scm_c_define ("SEEK_CUR", scm_from_int (SEEK_CUR));
- scm_c_define ("SEEK_END", scm_from_int (SEEK_END));
- scm_tc16_void_port = scm_make_port_type ("void", fill_input_void_port,
- write_void_port);
- cur_inport_fluid = scm_make_fluid ();
- cur_outport_fluid = scm_make_fluid ();
- cur_errport_fluid = scm_make_fluid ();
- cur_warnport_fluid = scm_make_fluid ();
- cur_loadport_fluid = scm_make_fluid ();
- scm_i_port_weak_set = scm_c_make_weak_set (31);
- #include "libguile/ports.x"
- /* Use Latin-1 as the default port encoding. */
- SCM_VARIABLE_SET (default_port_encoding_var,
- scm_make_fluid_with_default (SCM_BOOL_F));
- scm_port_encoding_init = 1;
- SCM_VARIABLE_SET (default_conversion_strategy_var,
- scm_make_fluid_with_default (sym_substitute));
- scm_conversion_strategy_init = 1;
- /* These bindings are used when boot-9 turns `current-input-port' et
- al into parameters. They are then removed from the guile module. */
- scm_c_define ("%current-input-port-fluid", cur_inport_fluid);
- scm_c_define ("%current-output-port-fluid", cur_outport_fluid);
- scm_c_define ("%current-error-port-fluid", cur_errport_fluid);
- scm_c_define ("%current-warning-port-fluid", cur_warnport_fluid);
- }
- /*
- Local Variables:
- c-file-style: "gnu"
- End:
- */
|