12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164 |
- /*
- * entities.c : implementation for the XML entities handling
- *
- * See Copyright for the status of this software.
- *
- * daniel@veillard.com
- */
- /* To avoid EBCDIC trouble when parsing on zOS */
- #if defined(__MVS__)
- #pragma convert("ISO8859-1")
- #endif
- #define IN_LIBXML
- #include "libxml.h"
- #include <string.h>
- #ifdef HAVE_STDLIB_H
- #include <stdlib.h>
- #endif
- #include <libxml/xmlmemory.h>
- #include <libxml/hash.h>
- #include <libxml/entities.h>
- #include <libxml/parser.h>
- #include <libxml/parserInternals.h>
- #include <libxml/xmlerror.h>
- #include <libxml/globals.h>
- #include <libxml/dict.h>
- #include "save.h"
- /*
- * The XML predefined entities.
- */
- static xmlEntity xmlEntityLt = {
- NULL, XML_ENTITY_DECL, BAD_CAST "lt",
- NULL, NULL, NULL, NULL, NULL, NULL,
- BAD_CAST "<", BAD_CAST "<", 1,
- XML_INTERNAL_PREDEFINED_ENTITY,
- NULL, NULL, NULL, NULL, 0, 1
- };
- static xmlEntity xmlEntityGt = {
- NULL, XML_ENTITY_DECL, BAD_CAST "gt",
- NULL, NULL, NULL, NULL, NULL, NULL,
- BAD_CAST ">", BAD_CAST ">", 1,
- XML_INTERNAL_PREDEFINED_ENTITY,
- NULL, NULL, NULL, NULL, 0, 1
- };
- static xmlEntity xmlEntityAmp = {
- NULL, XML_ENTITY_DECL, BAD_CAST "amp",
- NULL, NULL, NULL, NULL, NULL, NULL,
- BAD_CAST "&", BAD_CAST "&", 1,
- XML_INTERNAL_PREDEFINED_ENTITY,
- NULL, NULL, NULL, NULL, 0, 1
- };
- static xmlEntity xmlEntityQuot = {
- NULL, XML_ENTITY_DECL, BAD_CAST "quot",
- NULL, NULL, NULL, NULL, NULL, NULL,
- BAD_CAST "\"", BAD_CAST "\"", 1,
- XML_INTERNAL_PREDEFINED_ENTITY,
- NULL, NULL, NULL, NULL, 0, 1
- };
- static xmlEntity xmlEntityApos = {
- NULL, XML_ENTITY_DECL, BAD_CAST "apos",
- NULL, NULL, NULL, NULL, NULL, NULL,
- BAD_CAST "'", BAD_CAST "'", 1,
- XML_INTERNAL_PREDEFINED_ENTITY,
- NULL, NULL, NULL, NULL, 0, 1
- };
- /**
- * xmlEntitiesErrMemory:
- * @extra: extra information
- *
- * Handle an out of memory condition
- */
- static void
- xmlEntitiesErrMemory(const char *extra)
- {
- __xmlSimpleError(XML_FROM_TREE, XML_ERR_NO_MEMORY, NULL, NULL, extra);
- }
- /**
- * xmlEntitiesErr:
- * @code: the error code
- * @msg: the message
- *
- * Handle an out of memory condition
- */
- static void LIBXML_ATTR_FORMAT(2,0)
- xmlEntitiesErr(xmlParserErrors code, const char *msg)
- {
- __xmlSimpleError(XML_FROM_TREE, code, NULL, msg, NULL);
- }
- /*
- * xmlFreeEntity : clean-up an entity record.
- */
- static void
- xmlFreeEntity(xmlEntityPtr entity)
- {
- xmlDictPtr dict = NULL;
- if (entity == NULL)
- return;
- if (entity->doc != NULL)
- dict = entity->doc->dict;
- if ((entity->children) && (entity->owner == 1) &&
- (entity == (xmlEntityPtr) entity->children->parent))
- xmlFreeNodeList(entity->children);
- if (dict != NULL) {
- if ((entity->name != NULL) && (!xmlDictOwns(dict, entity->name)))
- xmlFree((char *) entity->name);
- if ((entity->ExternalID != NULL) &&
- (!xmlDictOwns(dict, entity->ExternalID)))
- xmlFree((char *) entity->ExternalID);
- if ((entity->SystemID != NULL) &&
- (!xmlDictOwns(dict, entity->SystemID)))
- xmlFree((char *) entity->SystemID);
- if ((entity->URI != NULL) && (!xmlDictOwns(dict, entity->URI)))
- xmlFree((char *) entity->URI);
- if ((entity->content != NULL)
- && (!xmlDictOwns(dict, entity->content)))
- xmlFree((char *) entity->content);
- if ((entity->orig != NULL) && (!xmlDictOwns(dict, entity->orig)))
- xmlFree((char *) entity->orig);
- } else {
- if (entity->name != NULL)
- xmlFree((char *) entity->name);
- if (entity->ExternalID != NULL)
- xmlFree((char *) entity->ExternalID);
- if (entity->SystemID != NULL)
- xmlFree((char *) entity->SystemID);
- if (entity->URI != NULL)
- xmlFree((char *) entity->URI);
- if (entity->content != NULL)
- xmlFree((char *) entity->content);
- if (entity->orig != NULL)
- xmlFree((char *) entity->orig);
- }
- xmlFree(entity);
- }
- /*
- * xmlCreateEntity:
- *
- * internal routine doing the entity node structures allocations
- */
- static xmlEntityPtr
- xmlCreateEntity(xmlDictPtr dict, const xmlChar *name, int type,
- const xmlChar *ExternalID, const xmlChar *SystemID,
- const xmlChar *content) {
- xmlEntityPtr ret;
- ret = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
- if (ret == NULL) {
- xmlEntitiesErrMemory("xmlCreateEntity: malloc failed");
- return(NULL);
- }
- memset(ret, 0, sizeof(xmlEntity));
- ret->type = XML_ENTITY_DECL;
- ret->checked = 0;
- /*
- * fill the structure.
- */
- ret->etype = (xmlEntityType) type;
- if (dict == NULL) {
- ret->name = xmlStrdup(name);
- if (ExternalID != NULL)
- ret->ExternalID = xmlStrdup(ExternalID);
- if (SystemID != NULL)
- ret->SystemID = xmlStrdup(SystemID);
- } else {
- ret->name = xmlDictLookup(dict, name, -1);
- if (ExternalID != NULL)
- ret->ExternalID = xmlDictLookup(dict, ExternalID, -1);
- if (SystemID != NULL)
- ret->SystemID = xmlDictLookup(dict, SystemID, -1);
- }
- if (content != NULL) {
- ret->length = xmlStrlen(content);
- if ((dict != NULL) && (ret->length < 5))
- ret->content = (xmlChar *)
- xmlDictLookup(dict, content, ret->length);
- else
- ret->content = xmlStrndup(content, ret->length);
- } else {
- ret->length = 0;
- ret->content = NULL;
- }
- ret->URI = NULL; /* to be computed by the layer knowing
- the defining entity */
- ret->orig = NULL;
- ret->owner = 0;
- return(ret);
- }
- /*
- * xmlAddEntity : register a new entity for an entities table.
- */
- static xmlEntityPtr
- xmlAddEntity(xmlDtdPtr dtd, const xmlChar *name, int type,
- const xmlChar *ExternalID, const xmlChar *SystemID,
- const xmlChar *content) {
- xmlDictPtr dict = NULL;
- xmlEntitiesTablePtr table = NULL;
- xmlEntityPtr ret, predef;
- if (name == NULL)
- return(NULL);
- if (dtd == NULL)
- return(NULL);
- if (dtd->doc != NULL)
- dict = dtd->doc->dict;
- switch (type) {
- case XML_INTERNAL_GENERAL_ENTITY:
- case XML_EXTERNAL_GENERAL_PARSED_ENTITY:
- case XML_EXTERNAL_GENERAL_UNPARSED_ENTITY:
- predef = xmlGetPredefinedEntity(name);
- if (predef != NULL) {
- int valid = 0;
- /* 4.6 Predefined Entities */
- if ((type == XML_INTERNAL_GENERAL_ENTITY) &&
- (content != NULL)) {
- int c = predef->content[0];
- if (((content[0] == c) && (content[1] == 0)) &&
- ((c == '>') || (c == '\'') || (c == '"'))) {
- valid = 1;
- } else if ((content[0] == '&') && (content[1] == '#')) {
- if (content[2] == 'x') {
- xmlChar *hex = BAD_CAST "0123456789ABCDEF";
- xmlChar ref[] = "00;";
- ref[0] = hex[c / 16 % 16];
- ref[1] = hex[c % 16];
- if (xmlStrcasecmp(&content[3], ref) == 0)
- valid = 1;
- } else {
- xmlChar ref[] = "00;";
- ref[0] = '0' + c / 10 % 10;
- ref[1] = '0' + c % 10;
- if (xmlStrEqual(&content[2], ref))
- valid = 1;
- }
- }
- }
- if (!valid) {
- xmlEntitiesErr(XML_ERR_ENTITY_PROCESSING,
- "xmlAddEntity: invalid redeclaration of predefined"
- " entity");
- return(NULL);
- }
- }
- if (dtd->entities == NULL)
- dtd->entities = xmlHashCreateDict(0, dict);
- table = dtd->entities;
- break;
- case XML_INTERNAL_PARAMETER_ENTITY:
- case XML_EXTERNAL_PARAMETER_ENTITY:
- if (dtd->pentities == NULL)
- dtd->pentities = xmlHashCreateDict(0, dict);
- table = dtd->pentities;
- break;
- case XML_INTERNAL_PREDEFINED_ENTITY:
- return(NULL);
- }
- if (table == NULL)
- return(NULL);
- ret = xmlCreateEntity(dict, name, type, ExternalID, SystemID, content);
- if (ret == NULL)
- return(NULL);
- ret->doc = dtd->doc;
- if (xmlHashAddEntry(table, name, ret)) {
- /*
- * entity was already defined at another level.
- */
- xmlFreeEntity(ret);
- return(NULL);
- }
- return(ret);
- }
- /**
- * xmlGetPredefinedEntity:
- * @name: the entity name
- *
- * Check whether this name is an predefined entity.
- *
- * Returns NULL if not, otherwise the entity
- */
- xmlEntityPtr
- xmlGetPredefinedEntity(const xmlChar *name) {
- if (name == NULL) return(NULL);
- switch (name[0]) {
- case 'l':
- if (xmlStrEqual(name, BAD_CAST "lt"))
- return(&xmlEntityLt);
- break;
- case 'g':
- if (xmlStrEqual(name, BAD_CAST "gt"))
- return(&xmlEntityGt);
- break;
- case 'a':
- if (xmlStrEqual(name, BAD_CAST "amp"))
- return(&xmlEntityAmp);
- if (xmlStrEqual(name, BAD_CAST "apos"))
- return(&xmlEntityApos);
- break;
- case 'q':
- if (xmlStrEqual(name, BAD_CAST "quot"))
- return(&xmlEntityQuot);
- break;
- default:
- break;
- }
- return(NULL);
- }
- /**
- * xmlAddDtdEntity:
- * @doc: the document
- * @name: the entity name
- * @type: the entity type XML_xxx_yyy_ENTITY
- * @ExternalID: the entity external ID if available
- * @SystemID: the entity system ID if available
- * @content: the entity content
- *
- * Register a new entity for this document DTD external subset.
- *
- * Returns a pointer to the entity or NULL in case of error
- */
- xmlEntityPtr
- xmlAddDtdEntity(xmlDocPtr doc, const xmlChar *name, int type,
- const xmlChar *ExternalID, const xmlChar *SystemID,
- const xmlChar *content) {
- xmlEntityPtr ret;
- xmlDtdPtr dtd;
- if (doc == NULL) {
- xmlEntitiesErr(XML_DTD_NO_DOC,
- "xmlAddDtdEntity: document is NULL");
- return(NULL);
- }
- if (doc->extSubset == NULL) {
- xmlEntitiesErr(XML_DTD_NO_DTD,
- "xmlAddDtdEntity: document without external subset");
- return(NULL);
- }
- dtd = doc->extSubset;
- ret = xmlAddEntity(dtd, name, type, ExternalID, SystemID, content);
- if (ret == NULL) return(NULL);
- /*
- * Link it to the DTD
- */
- ret->parent = dtd;
- ret->doc = dtd->doc;
- if (dtd->last == NULL) {
- dtd->children = dtd->last = (xmlNodePtr) ret;
- } else {
- dtd->last->next = (xmlNodePtr) ret;
- ret->prev = dtd->last;
- dtd->last = (xmlNodePtr) ret;
- }
- return(ret);
- }
- /**
- * xmlAddDocEntity:
- * @doc: the document
- * @name: the entity name
- * @type: the entity type XML_xxx_yyy_ENTITY
- * @ExternalID: the entity external ID if available
- * @SystemID: the entity system ID if available
- * @content: the entity content
- *
- * Register a new entity for this document.
- *
- * Returns a pointer to the entity or NULL in case of error
- */
- xmlEntityPtr
- xmlAddDocEntity(xmlDocPtr doc, const xmlChar *name, int type,
- const xmlChar *ExternalID, const xmlChar *SystemID,
- const xmlChar *content) {
- xmlEntityPtr ret;
- xmlDtdPtr dtd;
- if (doc == NULL) {
- xmlEntitiesErr(XML_DTD_NO_DOC,
- "xmlAddDocEntity: document is NULL");
- return(NULL);
- }
- if (doc->intSubset == NULL) {
- xmlEntitiesErr(XML_DTD_NO_DTD,
- "xmlAddDocEntity: document without internal subset");
- return(NULL);
- }
- dtd = doc->intSubset;
- ret = xmlAddEntity(dtd, name, type, ExternalID, SystemID, content);
- if (ret == NULL) return(NULL);
- /*
- * Link it to the DTD
- */
- ret->parent = dtd;
- ret->doc = dtd->doc;
- if (dtd->last == NULL) {
- dtd->children = dtd->last = (xmlNodePtr) ret;
- } else {
- dtd->last->next = (xmlNodePtr) ret;
- ret->prev = dtd->last;
- dtd->last = (xmlNodePtr) ret;
- }
- return(ret);
- }
- /**
- * xmlNewEntity:
- * @doc: the document
- * @name: the entity name
- * @type: the entity type XML_xxx_yyy_ENTITY
- * @ExternalID: the entity external ID if available
- * @SystemID: the entity system ID if available
- * @content: the entity content
- *
- * Create a new entity, this differs from xmlAddDocEntity() that if
- * the document is NULL or has no internal subset defined, then an
- * unlinked entity structure will be returned, it is then the responsibility
- * of the caller to link it to the document later or free it when not needed
- * anymore.
- *
- * Returns a pointer to the entity or NULL in case of error
- */
- xmlEntityPtr
- xmlNewEntity(xmlDocPtr doc, const xmlChar *name, int type,
- const xmlChar *ExternalID, const xmlChar *SystemID,
- const xmlChar *content) {
- xmlEntityPtr ret;
- xmlDictPtr dict;
- if ((doc != NULL) && (doc->intSubset != NULL)) {
- return(xmlAddDocEntity(doc, name, type, ExternalID, SystemID, content));
- }
- if (doc != NULL)
- dict = doc->dict;
- else
- dict = NULL;
- ret = xmlCreateEntity(dict, name, type, ExternalID, SystemID, content);
- if (ret == NULL)
- return(NULL);
- ret->doc = doc;
- return(ret);
- }
- /**
- * xmlGetEntityFromTable:
- * @table: an entity table
- * @name: the entity name
- * @parameter: look for parameter entities
- *
- * Do an entity lookup in the table.
- * returns the corresponding parameter entity, if found.
- *
- * Returns A pointer to the entity structure or NULL if not found.
- */
- static xmlEntityPtr
- xmlGetEntityFromTable(xmlEntitiesTablePtr table, const xmlChar *name) {
- return((xmlEntityPtr) xmlHashLookup(table, name));
- }
- /**
- * xmlGetParameterEntity:
- * @doc: the document referencing the entity
- * @name: the entity name
- *
- * Do an entity lookup in the internal and external subsets and
- * returns the corresponding parameter entity, if found.
- *
- * Returns A pointer to the entity structure or NULL if not found.
- */
- xmlEntityPtr
- xmlGetParameterEntity(xmlDocPtr doc, const xmlChar *name) {
- xmlEntitiesTablePtr table;
- xmlEntityPtr ret;
- if (doc == NULL)
- return(NULL);
- if ((doc->intSubset != NULL) && (doc->intSubset->pentities != NULL)) {
- table = (xmlEntitiesTablePtr) doc->intSubset->pentities;
- ret = xmlGetEntityFromTable(table, name);
- if (ret != NULL)
- return(ret);
- }
- if ((doc->extSubset != NULL) && (doc->extSubset->pentities != NULL)) {
- table = (xmlEntitiesTablePtr) doc->extSubset->pentities;
- return(xmlGetEntityFromTable(table, name));
- }
- return(NULL);
- }
- /**
- * xmlGetDtdEntity:
- * @doc: the document referencing the entity
- * @name: the entity name
- *
- * Do an entity lookup in the DTD entity hash table and
- * returns the corresponding entity, if found.
- * Note: the first argument is the document node, not the DTD node.
- *
- * Returns A pointer to the entity structure or NULL if not found.
- */
- xmlEntityPtr
- xmlGetDtdEntity(xmlDocPtr doc, const xmlChar *name) {
- xmlEntitiesTablePtr table;
- if (doc == NULL)
- return(NULL);
- if ((doc->extSubset != NULL) && (doc->extSubset->entities != NULL)) {
- table = (xmlEntitiesTablePtr) doc->extSubset->entities;
- return(xmlGetEntityFromTable(table, name));
- }
- return(NULL);
- }
- /**
- * xmlGetDocEntity:
- * @doc: the document referencing the entity
- * @name: the entity name
- *
- * Do an entity lookup in the document entity hash table and
- * returns the corresponding entity, otherwise a lookup is done
- * in the predefined entities too.
- *
- * Returns A pointer to the entity structure or NULL if not found.
- */
- xmlEntityPtr
- xmlGetDocEntity(const xmlDoc *doc, const xmlChar *name) {
- xmlEntityPtr cur;
- xmlEntitiesTablePtr table;
- if (doc != NULL) {
- if ((doc->intSubset != NULL) && (doc->intSubset->entities != NULL)) {
- table = (xmlEntitiesTablePtr) doc->intSubset->entities;
- cur = xmlGetEntityFromTable(table, name);
- if (cur != NULL)
- return(cur);
- }
- if (doc->standalone != 1) {
- if ((doc->extSubset != NULL) &&
- (doc->extSubset->entities != NULL)) {
- table = (xmlEntitiesTablePtr) doc->extSubset->entities;
- cur = xmlGetEntityFromTable(table, name);
- if (cur != NULL)
- return(cur);
- }
- }
- }
- return(xmlGetPredefinedEntity(name));
- }
/*
 * growBufferReentrant:
 *
 * Macro used to grow the current buffer: doubles the caller's output
 * buffer. The expansion relies on the enclosing function providing an
 * xmlChar pointer named `buffer`, a size_t named `buffer_size` and a
 * `mem_error` label, which is jumped to when the doubled size wraps around
 * or when xmlRealloc() fails (the old buffer is left untouched then).
 *
 * The body is wrapped in do { } while (0) so that the macro behaves as a
 * single statement and can be used safely in an unbraced if/else.
 */
#define growBufferReentrant() do {					\
    xmlChar *tmp;							\
    size_t new_size = buffer_size * 2;					\
    if (new_size < buffer_size) goto mem_error;				\
    tmp = (xmlChar *) xmlRealloc(buffer, new_size);			\
    if (tmp == NULL) goto mem_error;					\
    buffer = tmp;							\
    buffer_size = new_size;						\
} while (0)
- /**
- * xmlEncodeEntitiesInternal:
- * @doc: the document containing the string
- * @input: A string to convert to XML.
- * @attr: are we handling an attribute value
- *
- * Do a global encoding of a string, replacing the predefined entities
- * and non ASCII values with their entities and CharRef counterparts.
- * Contrary to xmlEncodeEntities, this routine is reentrant, and result
- * must be deallocated.
- *
- * Returns A newly allocated string with the substitution done.
- */
- static xmlChar *
- xmlEncodeEntitiesInternal(xmlDocPtr doc, const xmlChar *input, int attr) {
- const xmlChar *cur = input;
- xmlChar *buffer = NULL;
- xmlChar *out = NULL;
- size_t buffer_size = 0;
- int html = 0;
- if (input == NULL) return(NULL);
- if (doc != NULL)
- html = (doc->type == XML_HTML_DOCUMENT_NODE);
- /*
- * allocate an translation buffer.
- */
- buffer_size = 1000;
- buffer = (xmlChar *) xmlMalloc(buffer_size * sizeof(xmlChar));
- if (buffer == NULL) {
- xmlEntitiesErrMemory("xmlEncodeEntities: malloc failed");
- return(NULL);
- }
- out = buffer;
- while (*cur != '\0') {
- size_t indx = out - buffer;
- if (indx + 100 > buffer_size) {
- growBufferReentrant();
- out = &buffer[indx];
- }
- /*
- * By default one have to encode at least '<', '>', '"' and '&' !
- */
- if (*cur == '<') {
- const xmlChar *end;
- /*
- * Special handling of server side include in HTML attributes
- */
- if (html && attr &&
- (cur[1] == '!') && (cur[2] == '-') && (cur[3] == '-') &&
- ((end = xmlStrstr(cur, BAD_CAST "-->")) != NULL)) {
- while (cur != end) {
- *out++ = *cur++;
- indx = out - buffer;
- if (indx + 100 > buffer_size) {
- growBufferReentrant();
- out = &buffer[indx];
- }
- }
- *out++ = *cur++;
- *out++ = *cur++;
- *out++ = *cur++;
- continue;
- }
- *out++ = '&';
- *out++ = 'l';
- *out++ = 't';
- *out++ = ';';
- } else if (*cur == '>') {
- *out++ = '&';
- *out++ = 'g';
- *out++ = 't';
- *out++ = ';';
- } else if (*cur == '&') {
- /*
- * Special handling of &{...} construct from HTML 4, see
- * http://www.w3.org/TR/html401/appendix/notes.html#h-B.7.1
- */
- if (html && attr && (cur[1] == '{') &&
- (strchr((const char *) cur, '}'))) {
- while (*cur != '}') {
- *out++ = *cur++;
- indx = out - buffer;
- if (indx + 100 > buffer_size) {
- growBufferReentrant();
- out = &buffer[indx];
- }
- }
- *out++ = *cur++;
- continue;
- }
- *out++ = '&';
- *out++ = 'a';
- *out++ = 'm';
- *out++ = 'p';
- *out++ = ';';
- } else if (((*cur >= 0x20) && (*cur < 0x80)) ||
- (*cur == '\n') || (*cur == '\t') || ((html) && (*cur == '\r'))) {
- /*
- * default case, just copy !
- */
- *out++ = *cur;
- } else if (*cur >= 0x80) {
- if (((doc != NULL) && (doc->encoding != NULL)) || (html)) {
- /*
- * Bjørn Reese <br@sseusa.com> provided the patch
- xmlChar xc;
- xc = (*cur & 0x3F) << 6;
- if (cur[1] != 0) {
- xc += *(++cur) & 0x3F;
- *out++ = xc;
- } else
- */
- *out++ = *cur;
- } else {
- /*
- * We assume we have UTF-8 input.
- * It must match either:
- * 110xxxxx 10xxxxxx
- * 1110xxxx 10xxxxxx 10xxxxxx
- * 11110xxx 10xxxxxx 10xxxxxx 10xxxxxx
- * That is:
- * cur[0] is 11xxxxxx
- * cur[1] is 10xxxxxx
- * cur[2] is 10xxxxxx if cur[0] is 111xxxxx
- * cur[3] is 10xxxxxx if cur[0] is 1111xxxx
- * cur[0] is not 11111xxx
- */
- char buf[11], *ptr;
- int val = 0, l = 1;
- if (((cur[0] & 0xC0) != 0xC0) ||
- ((cur[1] & 0xC0) != 0x80) ||
- (((cur[0] & 0xE0) == 0xE0) && ((cur[2] & 0xC0) != 0x80)) ||
- (((cur[0] & 0xF0) == 0xF0) && ((cur[3] & 0xC0) != 0x80)) ||
- (((cur[0] & 0xF8) == 0xF8))) {
- xmlEntitiesErr(XML_CHECK_NOT_UTF8,
- "xmlEncodeEntities: input not UTF-8");
- if (doc != NULL)
- doc->encoding = xmlStrdup(BAD_CAST "ISO-8859-1");
- snprintf(buf, sizeof(buf), "&#%d;", *cur);
- buf[sizeof(buf) - 1] = 0;
- ptr = buf;
- while (*ptr != 0) *out++ = *ptr++;
- cur++;
- continue;
- } else if (*cur < 0xE0) {
- val = (cur[0]) & 0x1F;
- val <<= 6;
- val |= (cur[1]) & 0x3F;
- l = 2;
- } else if (*cur < 0xF0) {
- val = (cur[0]) & 0x0F;
- val <<= 6;
- val |= (cur[1]) & 0x3F;
- val <<= 6;
- val |= (cur[2]) & 0x3F;
- l = 3;
- } else if (*cur < 0xF8) {
- val = (cur[0]) & 0x07;
- val <<= 6;
- val |= (cur[1]) & 0x3F;
- val <<= 6;
- val |= (cur[2]) & 0x3F;
- val <<= 6;
- val |= (cur[3]) & 0x3F;
- l = 4;
- }
- if ((l == 1) || (!IS_CHAR(val))) {
- xmlEntitiesErr(XML_ERR_INVALID_CHAR,
- "xmlEncodeEntities: char out of range\n");
- if (doc != NULL)
- doc->encoding = xmlStrdup(BAD_CAST "ISO-8859-1");
- snprintf(buf, sizeof(buf), "&#%d;", *cur);
- buf[sizeof(buf) - 1] = 0;
- ptr = buf;
- while (*ptr != 0) *out++ = *ptr++;
- cur++;
- continue;
- }
- /*
- * We could do multiple things here. Just save as a char ref
- */
- snprintf(buf, sizeof(buf), "&#x%X;", val);
- buf[sizeof(buf) - 1] = 0;
- ptr = buf;
- while (*ptr != 0) *out++ = *ptr++;
- cur += l;
- continue;
- }
- } else if (IS_BYTE_CHAR(*cur)) {
- char buf[11], *ptr;
- snprintf(buf, sizeof(buf), "&#%d;", *cur);
- buf[sizeof(buf) - 1] = 0;
- ptr = buf;
- while (*ptr != 0) *out++ = *ptr++;
- }
- cur++;
- }
- *out = 0;
- return(buffer);
- mem_error:
- xmlEntitiesErrMemory("xmlEncodeEntities: realloc failed");
- xmlFree(buffer);
- return(NULL);
- }
- /**
- * xmlEncodeAttributeEntities:
- * @doc: the document containing the string
- * @input: A string to convert to XML.
- *
- * Do a global encoding of a string, replacing the predefined entities
- * and non ASCII values with their entities and CharRef counterparts for
- * attribute values.
- *
- * Returns A newly allocated string with the substitution done.
- */
- xmlChar *
- xmlEncodeAttributeEntities(xmlDocPtr doc, const xmlChar *input) {
- return xmlEncodeEntitiesInternal(doc, input, 1);
- }
- /**
- * xmlEncodeEntitiesReentrant:
- * @doc: the document containing the string
- * @input: A string to convert to XML.
- *
- * Do a global encoding of a string, replacing the predefined entities
- * and non ASCII values with their entities and CharRef counterparts.
- * Contrary to xmlEncodeEntities, this routine is reentrant, and result
- * must be deallocated.
- *
- * Returns A newly allocated string with the substitution done.
- */
- xmlChar *
- xmlEncodeEntitiesReentrant(xmlDocPtr doc, const xmlChar *input) {
- return xmlEncodeEntitiesInternal(doc, input, 0);
- }
- /**
- * xmlEncodeSpecialChars:
- * @doc: the document containing the string
- * @input: A string to convert to XML.
- *
- * Do a global encoding of a string, replacing the predefined entities
- * this routine is reentrant, and result must be deallocated.
- *
- * Returns A newly allocated string with the substitution done.
- */
- xmlChar *
- xmlEncodeSpecialChars(const xmlDoc *doc ATTRIBUTE_UNUSED, const xmlChar *input) {
- const xmlChar *cur = input;
- xmlChar *buffer = NULL;
- xmlChar *out = NULL;
- size_t buffer_size = 0;
- if (input == NULL) return(NULL);
- /*
- * allocate an translation buffer.
- */
- buffer_size = 1000;
- buffer = (xmlChar *) xmlMalloc(buffer_size * sizeof(xmlChar));
- if (buffer == NULL) {
- xmlEntitiesErrMemory("xmlEncodeSpecialChars: malloc failed");
- return(NULL);
- }
- out = buffer;
- while (*cur != '\0') {
- size_t indx = out - buffer;
- if (indx + 10 > buffer_size) {
- growBufferReentrant();
- out = &buffer[indx];
- }
- /*
- * By default one have to encode at least '<', '>', '"' and '&' !
- */
- if (*cur == '<') {
- *out++ = '&';
- *out++ = 'l';
- *out++ = 't';
- *out++ = ';';
- } else if (*cur == '>') {
- *out++ = '&';
- *out++ = 'g';
- *out++ = 't';
- *out++ = ';';
- } else if (*cur == '&') {
- *out++ = '&';
- *out++ = 'a';
- *out++ = 'm';
- *out++ = 'p';
- *out++ = ';';
- } else if (*cur == '"') {
- *out++ = '&';
- *out++ = 'q';
- *out++ = 'u';
- *out++ = 'o';
- *out++ = 't';
- *out++ = ';';
- } else if (*cur == '\r') {
- *out++ = '&';
- *out++ = '#';
- *out++ = '1';
- *out++ = '3';
- *out++ = ';';
- } else {
- /*
- * Works because on UTF-8, all extended sequences cannot
- * result in bytes in the ASCII range.
- */
- *out++ = *cur;
- }
- cur++;
- }
- *out = 0;
- return(buffer);
- mem_error:
- xmlEntitiesErrMemory("xmlEncodeSpecialChars: realloc failed");
- xmlFree(buffer);
- return(NULL);
- }
- /**
- * xmlCreateEntitiesTable:
- *
- * create and initialize an empty entities hash table.
- * This really doesn't make sense and should be deprecated
- *
- * Returns the xmlEntitiesTablePtr just created or NULL in case of error.
- */
- xmlEntitiesTablePtr
- xmlCreateEntitiesTable(void) {
- return((xmlEntitiesTablePtr) xmlHashCreate(0));
- }
- /**
- * xmlFreeEntityWrapper:
- * @entity: An entity
- * @name: its name
- *
- * Deallocate the memory used by an entities in the hash table.
- */
- static void
- xmlFreeEntityWrapper(void *entity, const xmlChar *name ATTRIBUTE_UNUSED) {
- if (entity != NULL)
- xmlFreeEntity((xmlEntityPtr) entity);
- }
- /**
- * xmlFreeEntitiesTable:
- * @table: An entity table
- *
- * Deallocate the memory used by an entities hash table.
- */
- void
- xmlFreeEntitiesTable(xmlEntitiesTablePtr table) {
- xmlHashFree(table, xmlFreeEntityWrapper);
- }
- #ifdef LIBXML_TREE_ENABLED
- /**
- * xmlCopyEntity:
- * @ent: An entity
- *
- * Build a copy of an entity
- *
- * Returns the new xmlEntitiesPtr or NULL in case of error.
- */
- static void *
- xmlCopyEntity(void *payload, const xmlChar *name ATTRIBUTE_UNUSED) {
- xmlEntityPtr ent = (xmlEntityPtr) payload;
- xmlEntityPtr cur;
- cur = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
- if (cur == NULL) {
- xmlEntitiesErrMemory("xmlCopyEntity:: malloc failed");
- return(NULL);
- }
- memset(cur, 0, sizeof(xmlEntity));
- cur->type = XML_ENTITY_DECL;
- cur->etype = ent->etype;
- if (ent->name != NULL)
- cur->name = xmlStrdup(ent->name);
- if (ent->ExternalID != NULL)
- cur->ExternalID = xmlStrdup(ent->ExternalID);
- if (ent->SystemID != NULL)
- cur->SystemID = xmlStrdup(ent->SystemID);
- if (ent->content != NULL)
- cur->content = xmlStrdup(ent->content);
- if (ent->orig != NULL)
- cur->orig = xmlStrdup(ent->orig);
- if (ent->URI != NULL)
- cur->URI = xmlStrdup(ent->URI);
- return(cur);
- }
- /**
- * xmlCopyEntitiesTable:
- * @table: An entity table
- *
- * Build a copy of an entity table.
- *
- * Returns the new xmlEntitiesTablePtr or NULL in case of error.
- */
- xmlEntitiesTablePtr
- xmlCopyEntitiesTable(xmlEntitiesTablePtr table) {
- return(xmlHashCopy(table, xmlCopyEntity));
- }
- #endif /* LIBXML_TREE_ENABLED */
- #ifdef LIBXML_OUTPUT_ENABLED
- /**
- * xmlDumpEntityContent:
- * @buf: An XML buffer.
- * @content: The entity content.
- *
- * This will dump the quoted string value, taking care of the special
- * treatment required by %
- */
- static void
- xmlDumpEntityContent(xmlBufferPtr buf, const xmlChar *content) {
- if (buf->alloc == XML_BUFFER_ALLOC_IMMUTABLE) return;
- if (xmlStrchr(content, '%')) {
- const xmlChar * base, *cur;
- xmlBufferCCat(buf, "\"");
- base = cur = content;
- while (*cur != 0) {
- if (*cur == '"') {
- if (base != cur)
- xmlBufferAdd(buf, base, cur - base);
- xmlBufferAdd(buf, BAD_CAST """, 6);
- cur++;
- base = cur;
- } else if (*cur == '%') {
- if (base != cur)
- xmlBufferAdd(buf, base, cur - base);
- xmlBufferAdd(buf, BAD_CAST "%", 6);
- cur++;
- base = cur;
- } else {
- cur++;
- }
- }
- if (base != cur)
- xmlBufferAdd(buf, base, cur - base);
- xmlBufferCCat(buf, "\"");
- } else {
- xmlBufferWriteQuotedString(buf, content);
- }
- }
- /**
- * xmlDumpEntityDecl:
- * @buf: An XML buffer.
- * @ent: An entity table
- *
- * This will dump the content of the entity table as an XML DTD definition
- */
- void
- xmlDumpEntityDecl(xmlBufferPtr buf, xmlEntityPtr ent) {
- if ((buf == NULL) || (ent == NULL)) return;
- switch (ent->etype) {
- case XML_INTERNAL_GENERAL_ENTITY:
- xmlBufferWriteChar(buf, "<!ENTITY ");
- xmlBufferWriteCHAR(buf, ent->name);
- xmlBufferWriteChar(buf, " ");
- if (ent->orig != NULL)
- xmlBufferWriteQuotedString(buf, ent->orig);
- else
- xmlDumpEntityContent(buf, ent->content);
- xmlBufferWriteChar(buf, ">\n");
- break;
- case XML_EXTERNAL_GENERAL_PARSED_ENTITY:
- xmlBufferWriteChar(buf, "<!ENTITY ");
- xmlBufferWriteCHAR(buf, ent->name);
- if (ent->ExternalID != NULL) {
- xmlBufferWriteChar(buf, " PUBLIC ");
- xmlBufferWriteQuotedString(buf, ent->ExternalID);
- xmlBufferWriteChar(buf, " ");
- xmlBufferWriteQuotedString(buf, ent->SystemID);
- } else {
- xmlBufferWriteChar(buf, " SYSTEM ");
- xmlBufferWriteQuotedString(buf, ent->SystemID);
- }
- xmlBufferWriteChar(buf, ">\n");
- break;
- case XML_EXTERNAL_GENERAL_UNPARSED_ENTITY:
- xmlBufferWriteChar(buf, "<!ENTITY ");
- xmlBufferWriteCHAR(buf, ent->name);
- if (ent->ExternalID != NULL) {
- xmlBufferWriteChar(buf, " PUBLIC ");
- xmlBufferWriteQuotedString(buf, ent->ExternalID);
- xmlBufferWriteChar(buf, " ");
- xmlBufferWriteQuotedString(buf, ent->SystemID);
- } else {
- xmlBufferWriteChar(buf, " SYSTEM ");
- xmlBufferWriteQuotedString(buf, ent->SystemID);
- }
- if (ent->content != NULL) { /* Should be true ! */
- xmlBufferWriteChar(buf, " NDATA ");
- if (ent->orig != NULL)
- xmlBufferWriteCHAR(buf, ent->orig);
- else
- xmlBufferWriteCHAR(buf, ent->content);
- }
- xmlBufferWriteChar(buf, ">\n");
- break;
- case XML_INTERNAL_PARAMETER_ENTITY:
- xmlBufferWriteChar(buf, "<!ENTITY % ");
- xmlBufferWriteCHAR(buf, ent->name);
- xmlBufferWriteChar(buf, " ");
- if (ent->orig == NULL)
- xmlDumpEntityContent(buf, ent->content);
- else
- xmlBufferWriteQuotedString(buf, ent->orig);
- xmlBufferWriteChar(buf, ">\n");
- break;
- case XML_EXTERNAL_PARAMETER_ENTITY:
- xmlBufferWriteChar(buf, "<!ENTITY % ");
- xmlBufferWriteCHAR(buf, ent->name);
- if (ent->ExternalID != NULL) {
- xmlBufferWriteChar(buf, " PUBLIC ");
- xmlBufferWriteQuotedString(buf, ent->ExternalID);
- xmlBufferWriteChar(buf, " ");
- xmlBufferWriteQuotedString(buf, ent->SystemID);
- } else {
- xmlBufferWriteChar(buf, " SYSTEM ");
- xmlBufferWriteQuotedString(buf, ent->SystemID);
- }
- xmlBufferWriteChar(buf, ">\n");
- break;
- default:
- xmlEntitiesErr(XML_DTD_UNKNOWN_ENTITY,
- "xmlDumpEntitiesDecl: internal: unknown type entity type");
- }
- }
- /**
- * xmlDumpEntityDeclScan:
- * @ent: An entity table
- * @buf: An XML buffer.
- *
- * When using the hash table scan function, arguments need to be reversed
- */
- static void
- xmlDumpEntityDeclScan(void *ent, void *buf,
- const xmlChar *name ATTRIBUTE_UNUSED) {
- xmlDumpEntityDecl((xmlBufferPtr) buf, (xmlEntityPtr) ent);
- }
- /**
- * xmlDumpEntitiesTable:
- * @buf: An XML buffer.
- * @table: An entity table
- *
- * This will dump the content of the entity table as an XML DTD definition
- */
- void
- xmlDumpEntitiesTable(xmlBufferPtr buf, xmlEntitiesTablePtr table) {
- xmlHashScan(table, xmlDumpEntityDeclScan, buf);
- }
- #endif /* LIBXML_OUTPUT_ENABLED */
- #define bottom_entities
- #include "elfgcchack.h"
|