1
0
mirror of https://gitlab.gnome.org/GNOME/libxml2.git synced 2025-01-12 09:17:37 +03:00
libxml2/entities.c

969 lines
25 KiB
C
Raw Normal View History

2001-02-23 20:55:21 +03:00
/*
* entities.c : implementation for the XML entities handling
2001-02-23 20:55:21 +03:00
*
* See Copyright for the status of this software.
*
* daniel@veillard.com
2001-02-23 20:55:21 +03:00
*/
/* To avoid EBCDIC trouble when parsing on zOS */
#if defined(__MVS__)
#pragma convert("ISO8859-1")
#endif
#define IN_LIBXML
2001-04-21 20:57:29 +04:00
#include "libxml.h"
2001-02-23 20:55:21 +03:00
#include <string.h>
#include <stdlib.h>
2001-02-23 20:55:21 +03:00
#include <libxml/xmlmemory.h>
#include <libxml/hash.h>
#include <libxml/entities.h>
#include <libxml/parser.h>
#include <libxml/parserInternals.h>
2001-02-23 20:55:21 +03:00
#include <libxml/xmlerror.h>
#include <libxml/dict.h>
#include <libxml/xmlsave.h>
2001-02-23 20:55:21 +03:00
#include "private/entities.h"
#include "private/error.h"
2001-02-23 20:55:21 +03:00
/*
 * The XML predefined entities: lt, gt, amp, quot and apos.
 *
 * All five share the same positional initializer; only the variable,
 * the entity name and the single-character text differ, so a local
 * macro generates them. The text is stored twice and is followed by
 * its length (1).
 */
#define XML_PREDEFINED_ENTITY(var, ename, text) \
    static xmlEntity var = { \
        NULL, XML_ENTITY_DECL, BAD_CAST ename, \
        NULL, NULL, NULL, NULL, NULL, NULL, \
        BAD_CAST text, BAD_CAST text, 1, \
        XML_INTERNAL_PREDEFINED_ENTITY, \
        NULL, NULL, NULL, NULL, 0, 0, 0 \
    }

XML_PREDEFINED_ENTITY(xmlEntityLt, "lt", "<");
XML_PREDEFINED_ENTITY(xmlEntityGt, "gt", ">");
XML_PREDEFINED_ENTITY(xmlEntityAmp, "amp", "&");
XML_PREDEFINED_ENTITY(xmlEntityQuot, "quot", "\"");
XML_PREDEFINED_ENTITY(xmlEntityApos, "apos", "'");

#undef XML_PREDEFINED_ENTITY
/*
2024-05-20 14:58:22 +03:00
* xmlFreeEntity:
* @entity: an entity
*
* Frees the entity.
2001-02-23 20:55:21 +03:00
*/
2023-10-06 11:43:38 +03:00
void
xmlFreeEntity(xmlEntityPtr entity)
{
xmlDictPtr dict = NULL;
if (entity == NULL)
return;
if (entity->doc != NULL)
dict = entity->doc->dict;
2001-02-23 20:55:21 +03:00
if ((entity->children) &&
(entity == (xmlEntityPtr) entity->children->parent))
xmlFreeNodeList(entity->children);
if ((entity->name != NULL) &&
((dict == NULL) || (!xmlDictOwns(dict, entity->name))))
xmlFree((char *) entity->name);
if (entity->ExternalID != NULL)
xmlFree((char *) entity->ExternalID);
if (entity->SystemID != NULL)
xmlFree((char *) entity->SystemID);
if (entity->URI != NULL)
xmlFree((char *) entity->URI);
if (entity->content != NULL)
xmlFree((char *) entity->content);
if (entity->orig != NULL)
xmlFree((char *) entity->orig);
2001-02-23 20:55:21 +03:00
xmlFree(entity);
}
/*
 * xmlCreateEntity:
 * @doc:  the owning document, may be NULL
 * @name:  the entity name
 * @type:  the entity type, stored as xmlEntityType
 * @ExternalID:  the external ID, may be NULL
 * @SystemID:  the system ID, may be NULL
 * @content:  the entity content, may be NULL
 *
 * Internal routine allocating and filling an entity structure. The name
 * is interned in the document dictionary when there is one, otherwise
 * it is duplicated. The IDs and the content are always duplicated. The
 * URI and the original text are left NULL.
 *
 * Returns the new entity or NULL if an allocation failed.
 */
static xmlEntityPtr
xmlCreateEntity(xmlDocPtr doc, const xmlChar *name, int type,
	        const xmlChar *ExternalID, const xmlChar *SystemID,
	        const xmlChar *content) {
    xmlEntityPtr ent;

    ent = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
    if (ent == NULL)
	return(NULL);

    /* zeroing leaves length, content, URI and orig in their empty state */
    memset(ent, 0, sizeof(xmlEntity));
    ent->doc = doc;
    ent->type = XML_ENTITY_DECL;
    ent->etype = (xmlEntityType) type;

    if ((doc != NULL) && (doc->dict != NULL))
        ent->name = xmlDictLookup(doc->dict, name, -1);
    else
	ent->name = xmlStrdup(name);
    if (ent->name == NULL)
        goto error;

    if (ExternalID != NULL) {
        ent->ExternalID = xmlStrdup(ExternalID);
        if (ent->ExternalID == NULL)
            goto error;
    }

    if (SystemID != NULL) {
        ent->SystemID = xmlStrdup(SystemID);
        if (ent->SystemID == NULL)
            goto error;
    }

    if (content != NULL) {
        ent->length = xmlStrlen(content);
        ent->content = xmlStrndup(content, ent->length);
        if (ent->content == NULL)
            goto error;
    }

    return(ent);

error:
    xmlFreeEntity(ent);
    return(NULL);
}
/*
 * xmlAddEntityPredefOk:
 * @predef:  the predefined entity being redeclared
 * @type:  the type of the new declaration
 * @content:  the content of the new declaration, may be NULL
 *
 * Checks a redeclaration of a predefined entity (XML 4.6 Predefined
 * Entities). Only an internal general entity is accepted, and only if
 * its content is either the literal character (allowed for '>', '\''
 * and '"') or a two-digit hexadecimal or decimal character reference
 * to the predefined character.
 *
 * Returns 1 if the redeclaration is acceptable, 0 otherwise.
 */
static int
xmlAddEntityPredefOk(xmlEntityPtr predef, int type, const xmlChar *content) {
    static const char hexDigits[] = "0123456789ABCDEF";
    xmlChar ref[] = "00;";
    int c;

    if ((type != XML_INTERNAL_GENERAL_ENTITY) || (content == NULL))
        return(0);

    c = predef->content[0];

    /* the literal character itself */
    if ((content[0] == c) && (content[1] == 0) &&
        ((c == '>') || (c == '\'') || (c == '"')))
        return(1);

    if ((content[0] != '&') || (content[1] != '#'))
        return(0);

    if (content[2] == 'x') {
        /* hexadecimal reference, compared case-insensitively */
        ref[0] = hexDigits[c / 16 % 16];
        ref[1] = hexDigits[c % 16];
        return(xmlStrcasecmp(&content[3], ref) == 0);
    }

    /* decimal reference */
    ref[0] = '0' + c / 10 % 10;
    ref[1] = '0' + c % 10;
    return(xmlStrEqual(&content[2], ref) != 0);
}

/**
 * xmlAddEntity:
 * @doc:  the document
 * @extSubset:  add to the external or internal subset
 * @name:  the entity name
 * @type:  the entity type XML_xxx_yyy_ENTITY
 * @ExternalID:  the entity external ID if available
 * @SystemID:  the entity system ID if available
 * @content:  the entity content
 * @out:  pointer to resulting entity (optional)
 *
 * Register a new entity for this document. General entities go to the
 * entity table of the selected DTD subset, parameter entities to its
 * parameter entity table; the table is created on first use. On
 * success the entity is appended to the children of the DTD.
 *
 * @out, if given, is set to NULL on entry and to the new entity on
 * success.
 *
 * Available since 2.13.0.
 *
 * Returns 0 on success or an xmlParserErrors error code:
 * XML_ERR_ARGUMENT for a NULL @doc or @name or an unknown @type,
 * XML_DTD_NO_DTD if the selected subset does not exist,
 * XML_ERR_REDECL_PREDEF_ENTITY for an invalid redeclaration of a
 * predefined entity, XML_ERR_NO_MEMORY on allocation failure and
 * XML_WAR_ENTITY_REDEFINED if the name is already in the table.
 */
int
xmlAddEntity(xmlDocPtr doc, int extSubset, const xmlChar *name, int type,
	  const xmlChar *ExternalID, const xmlChar *SystemID,
	  const xmlChar *content, xmlEntityPtr *out) {
    xmlDtdPtr dtd;
    xmlDictPtr dict;
    xmlEntitiesTablePtr table = NULL;
    xmlEntityPtr ent, predef;
    int added;

    if (out != NULL)
        *out = NULL;
    if ((doc == NULL) || (name == NULL))
	return(XML_ERR_ARGUMENT);

    dict = doc->dict;
    dtd = extSubset ? doc->extSubset : doc->intSubset;
    if (dtd == NULL)
        return(XML_DTD_NO_DTD);

    switch (type) {
        case XML_INTERNAL_GENERAL_ENTITY:
        case XML_EXTERNAL_GENERAL_PARSED_ENTITY:
        case XML_EXTERNAL_GENERAL_UNPARSED_ENTITY:
            predef = xmlGetPredefinedEntity(name);
            if ((predef != NULL) &&
                (!xmlAddEntityPredefOk(predef, type, content)))
                return(XML_ERR_REDECL_PREDEF_ENTITY);

	    if (dtd->entities == NULL) {
		dtd->entities = xmlHashCreateDict(0, dict);
                if (dtd->entities == NULL)
                    return(XML_ERR_NO_MEMORY);
            }
	    table = dtd->entities;
	    break;

        case XML_INTERNAL_PARAMETER_ENTITY:
        case XML_EXTERNAL_PARAMETER_ENTITY:
	    if (dtd->pentities == NULL) {
		dtd->pentities = xmlHashCreateDict(0, dict);
                if (dtd->pentities == NULL)
                    return(XML_ERR_NO_MEMORY);
            }
	    table = dtd->pentities;
	    break;

        default:
	    return(XML_ERR_ARGUMENT);
    }

    ent = xmlCreateEntity(dtd->doc, name, type, ExternalID, SystemID,
                          content);
    if (ent == NULL)
        return(XML_ERR_NO_MEMORY);

    added = xmlHashAdd(table, name, ent);
    if (added <= 0) {
        /* negative: allocation failure, zero: name already declared */
	xmlFreeEntity(ent);
        return((added < 0) ? XML_ERR_NO_MEMORY : XML_WAR_ENTITY_REDEFINED);
    }

    /*
     * Link it to the DTD, appending to the list of children.
     */
    ent->parent = dtd;
    ent->doc = dtd->doc;
    if (dtd->last != NULL) {
	dtd->last->next = (xmlNodePtr) ent;
	ent->prev = dtd->last;
	dtd->last = (xmlNodePtr) ent;
    } else {
	dtd->children = dtd->last = (xmlNodePtr) ent;
    }

    if (out != NULL)
        *out = ent;
    return(0);
}
/**
 * xmlGetPredefinedEntity:
 * @name:  the entity name
 *
 * Check whether this name is a predefined entity, that is one of
 * "lt", "gt", "amp", "apos" or "quot".
 *
 * Returns NULL if not, otherwise the entity
 */
xmlEntityPtr
xmlGetPredefinedEntity(const xmlChar *name) {
    xmlChar first;

    if (name == NULL)
        return(NULL);

    /* dispatch on the first character to avoid useless comparisons */
    first = name[0];
    if (first == 'l') {
        if (xmlStrEqual(name, BAD_CAST "lt"))
            return(&xmlEntityLt);
    } else if (first == 'g') {
        if (xmlStrEqual(name, BAD_CAST "gt"))
            return(&xmlEntityGt);
    } else if (first == 'a') {
        if (xmlStrEqual(name, BAD_CAST "amp"))
            return(&xmlEntityAmp);
        if (xmlStrEqual(name, BAD_CAST "apos"))
            return(&xmlEntityApos);
    } else if (first == 'q') {
        if (xmlStrEqual(name, BAD_CAST "quot"))
            return(&xmlEntityQuot);
    }

    return(NULL);
}
/**
 * xmlAddDtdEntity:
 * @doc:  the document
 * @name:  the entity name
 * @type:  the entity type XML_xxx_yyy_ENTITY
 * @ExternalID:  the entity external ID if available
 * @SystemID:  the entity system ID if available
 * @content:  the entity content
 *
 * Register a new entity for this document DTD external subset.
 * This is xmlAddEntity() with the error code discarded.
 *
 * Returns a pointer to the entity or NULL in case of error
 */
xmlEntityPtr
xmlAddDtdEntity(xmlDocPtr doc, const xmlChar *name, int type,
	        const xmlChar *ExternalID, const xmlChar *SystemID,
		const xmlChar *content) {
    xmlEntityPtr entity = NULL;

    /* second argument 1 selects the external subset */
    (void) xmlAddEntity(doc, 1, name, type, ExternalID, SystemID, content,
                        &entity);
    return(entity);
}
/**
 * xmlAddDocEntity:
 * @doc:  the document
 * @name:  the entity name
 * @type:  the entity type XML_xxx_yyy_ENTITY
 * @ExternalID:  the entity external ID if available
 * @SystemID:  the entity system ID if available
 * @content:  the entity content
 *
 * Register a new entity for this document, in its internal subset.
 * This is xmlAddEntity() with the error code discarded.
 *
 * Returns a pointer to the entity or NULL in case of error
 */
xmlEntityPtr
xmlAddDocEntity(xmlDocPtr doc, const xmlChar *name, int type,
	        const xmlChar *ExternalID, const xmlChar *SystemID,
	        const xmlChar *content) {
    xmlEntityPtr entity = NULL;

    /* second argument 0 selects the internal subset */
    (void) xmlAddEntity(doc, 0, name, type, ExternalID, SystemID, content,
                        &entity);
    return(entity);
}
/**
 * xmlNewEntity:
 * @doc:  the document
 * @name:  the entity name
 * @type:  the entity type XML_xxx_yyy_ENTITY
 * @ExternalID:  the entity external ID if available
 * @SystemID:  the entity system ID if available
 * @content:  the entity content
 *
 * Create a new entity. This differs from xmlAddDocEntity() in that if
 * the document is NULL or has no internal subset defined, an unlinked
 * entity structure is returned. It is then the responsibility of the
 * caller to link it to the document later or to free it when it is
 * not needed anymore.
 *
 * Returns a pointer to the entity or NULL in case of error
 */
xmlEntityPtr
xmlNewEntity(xmlDocPtr doc, const xmlChar *name, int type,
	     const xmlChar *ExternalID, const xmlChar *SystemID,
	     const xmlChar *content) {
    if ((doc == NULL) || (doc->intSubset == NULL)) {
        /* no DTD to register with: build a free-standing entity */
        if (name == NULL)
            return(NULL);
        return(xmlCreateEntity(doc, name, type, ExternalID, SystemID,
                               content));
    }

    return(xmlAddDocEntity(doc, name, type, ExternalID, SystemID, content));
}
2001-02-23 20:55:21 +03:00
/**
* xmlGetEntityFromTable:
* @table: an entity table
* @name: the entity name
* @parameter: look for parameter entities
*
* Do an entity lookup in the table.
* returns the corresponding parameter entity, if found.
*
2001-02-23 20:55:21 +03:00
* Returns A pointer to the entity structure or NULL if not found.
*/
static xmlEntityPtr
2001-02-23 20:55:21 +03:00
xmlGetEntityFromTable(xmlEntitiesTablePtr table, const xmlChar *name) {
return((xmlEntityPtr) xmlHashLookup(table, name));
}
/**
 * xmlGetParameterEntity:
 * @doc:  the document referencing the entity
 * @name:  the entity name
 *
 * Do an entity lookup in the parameter entity tables of the internal
 * and then the external subset and returns the corresponding parameter
 * entity, if found.
 *
 * Returns A pointer to the entity structure or NULL if not found.
 */
xmlEntityPtr
xmlGetParameterEntity(xmlDocPtr doc, const xmlChar *name) {
    xmlDtdPtr subset;
    xmlEntityPtr found;

    if (doc == NULL)
	return(NULL);

    /* the internal subset takes precedence */
    subset = doc->intSubset;
    if ((subset != NULL) && (subset->pentities != NULL)) {
	found = xmlGetEntityFromTable(
                (xmlEntitiesTablePtr) subset->pentities, name);
	if (found != NULL)
	    return(found);
    }

    subset = doc->extSubset;
    if ((subset == NULL) || (subset->pentities == NULL))
        return(NULL);

    return(xmlGetEntityFromTable((xmlEntitiesTablePtr) subset->pentities,
                                 name));
}
/**
 * xmlGetDtdEntity:
 * @doc:  the document referencing the entity
 * @name:  the entity name
 *
 * Do an entity lookup in the entity hash table of the external subset
 * and returns the corresponding entity, if found.
 * Note: the first argument is the document node, not the DTD node.
 *
 * Returns A pointer to the entity structure or NULL if not found.
 */
xmlEntityPtr
xmlGetDtdEntity(xmlDocPtr doc, const xmlChar *name) {
    xmlDtdPtr ext;

    if (doc == NULL)
	return(NULL);

    ext = doc->extSubset;
    if ((ext == NULL) || (ext->entities == NULL))
        return(NULL);

    return(xmlGetEntityFromTable((xmlEntitiesTablePtr) ext->entities, name));
}
/**
* xmlGetDocEntity:
* @doc: the document referencing the entity
* @name: the entity name
*
* Do an entity lookup in the document entity hash table and
* returns the corresponding entity, otherwise a lookup is done
2001-02-23 20:55:21 +03:00
* in the predefined entities too.
*
2001-02-23 20:55:21 +03:00
* Returns A pointer to the entity structure or NULL if not found.
*/
xmlEntityPtr
xmlGetDocEntity(const xmlDoc *doc, const xmlChar *name) {
2001-02-23 20:55:21 +03:00
xmlEntityPtr cur;
xmlEntitiesTablePtr table;
if (doc != NULL) {
if ((doc->intSubset != NULL) && (doc->intSubset->entities != NULL)) {
table = (xmlEntitiesTablePtr) doc->intSubset->entities;
cur = xmlGetEntityFromTable(table, name);
if (cur != NULL)
return(cur);
}
if (doc->standalone != 1) {
if ((doc->extSubset != NULL) &&
(doc->extSubset->entities != NULL)) {
table = (xmlEntitiesTablePtr) doc->extSubset->entities;
cur = xmlGetEntityFromTable(table, name);
if (cur != NULL)
return(cur);
}
2001-02-23 20:55:21 +03:00
}
}
return(xmlGetPredefinedEntity(name));
2001-02-23 20:55:21 +03:00
}
/*
 * xmlSerializeHexCharRef:
 * @buf:  output buffer, must be large enough for the reference
 * @val:  the code point
 *
 * Writes "&#x", the upper-case hexadecimal digits of @val without
 * leading zeros (at least one digit), and ";" to @buf. Only the low
 * 24 bits of @val are considered when choosing the number of digits,
 * so at most 10 bytes are written. The output is not NUL-terminated.
 *
 * Returns the number of bytes written.
 */
int
xmlSerializeHexCharRef(char *buf, int val) {
    static const char digits[] = "0123456789ABCDEF";
    char *p = buf;
    int shift;

    *p++ = '&';
    *p++ = '#';
    *p++ = 'x';

    /* find the bit offset of the most significant non-zero nibble */
    if (val & 0xFF0000)
        shift = (val & 0xF00000) ? 20 : 16;
    else if (val & 0x00FF00)
        shift = (val & 0x00F000) ? 12 : 8;
    else
        shift = (val & 0x0000F0) ? 4 : 0;

    for (; shift >= 0; shift -= 4)
        *p++ = digits[(val >> shift) & 0x0F];

    *p++ = ';';

    return(p - buf);
}
/*
 * xmlSerializeDecCharRef:
 * @buf:  output buffer, must be large enough for the reference
 * @val:  the code point
 *
 * Writes "&#", the decimal digits of @val without leading zeros, and
 * ";" to @buf. At most seven digits are emitted, so at most 10 bytes
 * are written. The output is not NUL-terminated.
 *
 * Returns the number of bytes written.
 */
int
xmlSerializeDecCharRef(char *buf, int val) {
    static const int bounds[] = { 10, 100, 1000, 10000, 100000, 1000000 };
    char *digits = buf + 2;
    int len = 1;
    int k;

    buf[0] = '&';
    buf[1] = '#';

    /* one more digit for every power of ten reached, capped at seven */
    for (k = 0; k < (int) (sizeof(bounds) / sizeof(bounds[0])); k++) {
        if (val >= bounds[k])
            len += 1;
    }

    digits[len] = ';';

    /* fill the digits from the least significant one backwards */
    for (k = len; k > 0; k--) {
        digits[k - 1] = '0' + val % 10;
        val /= 10;
    }

    return(len + 3);
}
2024-07-12 03:01:06 +03:00
/*
 * Lookup table indexed by ASCII code (0x00-0x7F). A non-zero entry
 * means the fast path of xmlEscapeText can skip the byte without
 * further inspection. Entries are zero for NUL and the control
 * characters other than tab and line feed, and for '"', '&', '<'
 * and '>'.
 */
static const char xmlEscapeSafe[128] = {
    /* 0x00-0x0F: only '\t' (0x09) and '\n' (0x0A) are safe */
    0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0,
    /* 0x10-0x1F: no safe control characters */
    0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
    /* 0x20-0x2F: '"' (0x22) and '&' (0x26) need inspection */
    1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1,
    /* 0x30-0x3F: '<' (0x3C) and '>' (0x3E) need inspection */
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1,
    /* 0x40-0x7F: all safe */
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1
};
2001-02-23 20:55:21 +03:00
2024-07-12 03:01:06 +03:00
xmlChar *
xmlEscapeText(const xmlChar *text, int flags) {
const xmlChar *cur;
xmlChar *buffer;
xmlChar *out;
const xmlChar *unescaped;
size_t size = 50;
buffer = xmlMalloc(size + 1);
if (buffer == NULL)
2024-07-12 03:01:06 +03:00
return(NULL);
2001-02-23 20:55:21 +03:00
out = buffer;
2024-07-12 03:01:06 +03:00
cur = text;
unescaped = cur;
2024-07-12 03:01:06 +03:00
while (*cur != '\0') {
char buf[12];
2024-07-12 03:01:06 +03:00
const xmlChar *end;
const xmlChar *repl;
size_t used;
size_t replSize;
size_t unescapedSize;
size_t totalSize;
int chunkSize = 1;
int c;
/* accelerator */
while (1) {
c = *cur;
if (c < 0x80) {
if (!xmlEscapeSafe[*cur])
break;
} else {
if (flags & XML_ESCAPE_NON_ASCII)
break;
}
cur += 1;
}
if (c == 0) {
chunkSize = 0;
repl = BAD_CAST "";
replSize = 0;
} else if (c == '<') {
/*
* Special handling of server side include in HTML attributes
*/
2024-07-12 03:01:06 +03:00
if ((flags & XML_ESCAPE_HTML) && (flags & XML_ESCAPE_ATTR) &&
(cur[1] == '!') && (cur[2] == '-') && (cur[3] == '-') &&
((end = xmlStrstr(cur, BAD_CAST "-->")) != NULL)) {
2024-07-12 03:01:06 +03:00
chunkSize = (end - cur) + 3;
repl = cur;
replSize = chunkSize;
} else {
repl = BAD_CAST "&lt;";
replSize = 4;
}
} else if (c == '>') {
repl = BAD_CAST "&gt;";
replSize = 4;
} else if (c == '&') {
/*
* Special handling of &{...} construct from HTML 4, see
* http://www.w3.org/TR/html401/appendix/notes.html#h-B.7.1
*/
2024-07-12 03:01:06 +03:00
if ((flags & XML_ESCAPE_HTML) && (flags & XML_ESCAPE_ATTR) &&
(cur[1] == '{') && (end = xmlStrchr(cur, '}'))) {
chunkSize = (end - cur) + 1;
repl = cur;
replSize = chunkSize;
2001-02-23 20:55:21 +03:00
} else {
2024-07-12 03:01:06 +03:00
repl = BAD_CAST "&amp;";
replSize = 5;
}
} else if ((flags & XML_ESCAPE_QUOT) && (c == '"')) {
repl = BAD_CAST "&quot;";
replSize = 6;
} else if (((flags & XML_ESCAPE_HTML) == 0) && (c == '\r')) {
repl = BAD_CAST "&#13;";
replSize = 5;
} else if ((flags & XML_ESCAPE_NON_ASCII) && (c >= 0x80)) {
int val;
chunkSize = 4;
val = xmlGetUTF8Char(cur, &chunkSize);
if (val < 0) {
val = 0xFFFD;
chunkSize = 1;
} else if (((flags & XML_ESCAPE_ALLOW_INVALID) == 0) &&
(!IS_CHAR(val))) {
val = 0xFFFD;
}
2001-02-23 20:55:21 +03:00
replSize = xmlSerializeHexCharRef(buf, val);
2024-07-12 03:01:06 +03:00
repl = BAD_CAST buf;
} else if ((flags & XML_ESCAPE_ALLOW_INVALID) ||
(c >= 0x20) ||
(c == '\n') || (c == '\t') || (c == '\r')) {
/* default case, just copy */
cur += 1;
if (*cur != 0)
continue;
chunkSize = 0;
repl = BAD_CAST "";
replSize = 0;
} else {
/* ignore */
repl = BAD_CAST "";
replSize = 0;
}
used = out - buffer;
unescapedSize = cur - unescaped;
totalSize = unescapedSize + replSize;
cur += chunkSize;
if (totalSize > size - used) {
xmlChar *tmp;
size += totalSize;
if (*cur != 0)
size *= 2;
tmp = xmlRealloc(buffer, size + 1);
if (tmp == NULL) {
xmlFree(buffer);
return(NULL);
}
buffer = tmp;
out = buffer + used;
}
memcpy(out, unescaped, unescapedSize);
out += unescapedSize;
memcpy(out, repl, replSize);
out += replSize;
unescaped = cur;
2001-02-23 20:55:21 +03:00
}
2024-07-12 03:01:06 +03:00
*out = 0;
2001-02-23 20:55:21 +03:00
return(buffer);
}
/**
2024-07-12 03:01:06 +03:00
* xmlEncodeEntitiesInternal:
* @doc: the document containing the string
* @input: A string to convert to XML.
2024-07-12 03:01:06 +03:00
* @attr: are we handling an attribute value
*
* Do a global encoding of a string, replacing the predefined entities
2024-07-12 03:01:06 +03:00
* and non ASCII values with their entities and CharRef counterparts.
* Contrary to xmlEncodeEntities, this routine is reentrant, and result
* must be deallocated.
*
* Returns A newly allocated string with the substitution done.
*/
xmlChar *
2024-07-12 03:01:06 +03:00
xmlEncodeEntitiesInternal(xmlDocPtr doc, const xmlChar *input,
unsigned flags) {
if (input == NULL)
return(NULL);
if ((doc != NULL) && (doc->type == XML_HTML_DOCUMENT_NODE))
flags |= XML_ESCAPE_HTML;
else if ((doc == NULL) || (doc->encoding == NULL))
flags |= XML_ESCAPE_NON_ASCII;
return(xmlEscapeText(input, flags));
}
/**
 * xmlEncodeEntitiesReentrant:
 * @doc:  the document containing the string
 * @input:  A string to convert to XML.
 *
 * Do a global encoding of a string, replacing the predefined entities
 * and non ASCII values with their entities and CharRef counterparts.
 * Contrary to xmlEncodeEntities, this routine is reentrant, and result
 * must be deallocated.
 *
 * This escapes '<', '>', '&' and '\r'. If the document has no encoding,
 * non-ASCII codepoints are escaped. There is some special handling for
 * HTML documents.
 *
 * Returns A newly allocated string with the substitution done.
 */
xmlChar *
xmlEncodeEntitiesReentrant(xmlDocPtr doc, const xmlChar *input) {
    /* no additional escaping flags requested */
    const unsigned noFlags = 0;

    return(xmlEncodeEntitiesInternal(doc, input, noFlags));
}
2001-02-23 20:55:21 +03:00
/**
* xmlEncodeSpecialChars:
2024-07-12 03:01:06 +03:00
* @doc: unused
2001-02-23 20:55:21 +03:00
* @input: A string to convert to XML.
*
* Do a global encoding of a string, replacing the predefined entities
* this routine is reentrant, and result must be deallocated.
*
2024-07-12 03:01:06 +03:00
* This escapes '<', '>', '&', '"' and '\r' chars.
*
2001-02-23 20:55:21 +03:00
* Returns A newly allocated string with the substitution done.
*/
xmlChar *
2024-07-12 03:01:06 +03:00
xmlEncodeSpecialChars(const xmlDoc *doc ATTRIBUTE_UNUSED,
const xmlChar *input) {
if (input == NULL)
return(NULL);
2024-07-12 03:01:06 +03:00
return(xmlEscapeText(input, XML_ESCAPE_QUOT | XML_ESCAPE_ALLOW_INVALID));
2001-02-23 20:55:21 +03:00
}
/**
* xmlCreateEntitiesTable:
*
* create and initialize an empty entities hash table.
* This really doesn't make sense and should be deprecated
2001-02-23 20:55:21 +03:00
*
* Returns the xmlEntitiesTablePtr just created or NULL in case of error.
*/
xmlEntitiesTablePtr
xmlCreateEntitiesTable(void) {
return((xmlEntitiesTablePtr) xmlHashCreate(0));
}
/**
 * xmlFreeEntityWrapper:
 * @entity:  An entity
 * @name:  its name, unused
 *
 * Hash table deallocator callback releasing one entity of an entity
 * table.
 */
static void
xmlFreeEntityWrapper(void *entity, const xmlChar *name ATTRIBUTE_UNUSED) {
    if (entity == NULL)
        return;

    xmlFreeEntity((xmlEntityPtr) entity);
}
2001-02-23 20:55:21 +03:00
/**
 * xmlFreeEntitiesTable:
 * @table:  An entity table
 *
 * Deallocate the memory used by an entities hash table, releasing
 * every entity it contains through xmlFreeEntityWrapper.
 */
void
xmlFreeEntitiesTable(xmlEntitiesTablePtr table) {
    xmlHashFree(table, xmlFreeEntityWrapper);
}
/**
 * xmlCopyEntity:
 * @payload:  the entity to copy
 * @name:  the hash table key, unused
 *
 * Hash table copy callback building a copy of an entity. The name, the
 * IDs, the content, the original text and the URI are duplicated. The
 * copy is not attached to any document or DTD and has no children.
 *
 * The length of the copy is set from the duplicated content, like
 * xmlCreateEntity does, so that content and length stay consistent.
 *
 * Returns the new entity or NULL in case of error.
 */
static void *
xmlCopyEntity(void *payload, const xmlChar *name ATTRIBUTE_UNUSED) {
    xmlEntityPtr ent = (xmlEntityPtr) payload;
    xmlEntityPtr cur;

    cur = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
    if (cur == NULL)
	return(NULL);
    memset(cur, 0, sizeof(xmlEntity));
    cur->type = XML_ENTITY_DECL;
    cur->etype = ent->etype;

    if (ent->name != NULL) {
	cur->name = xmlStrdup(ent->name);
        if (cur->name == NULL)
            goto error;
    }
    if (ent->ExternalID != NULL) {
	cur->ExternalID = xmlStrdup(ent->ExternalID);
        if (cur->ExternalID == NULL)
            goto error;
    }
    if (ent->SystemID != NULL) {
	cur->SystemID = xmlStrdup(ent->SystemID);
        if (cur->SystemID == NULL)
            goto error;
    }
    if (ent->content != NULL) {
	cur->content = xmlStrdup(ent->content);
        if (cur->content == NULL)
            goto error;
        /* without this the copy would report a length of zero */
        cur->length = xmlStrlen(cur->content);
    }
    if (ent->orig != NULL) {
	cur->orig = xmlStrdup(ent->orig);
        if (cur->orig == NULL)
            goto error;
    }
    if (ent->URI != NULL) {
	cur->URI = xmlStrdup(ent->URI);
        if (cur->URI == NULL)
            goto error;
    }

    return(cur);

error:
    /* cur->doc is NULL, so the duplicated name is released as well */
    xmlFreeEntity(cur);
    return(NULL);
}
/**
 * xmlCopyEntitiesTable:
 * @table:  An entity table
 *
 * Build a copy of an entity table. Entities are copied with
 * xmlCopyEntity and released with xmlFreeEntityWrapper.
 *
 * Returns the new xmlEntitiesTablePtr or NULL in case of error.
 */
xmlEntitiesTablePtr
xmlCopyEntitiesTable(xmlEntitiesTablePtr table) {
    xmlEntitiesTablePtr copy;

    copy = xmlHashCopySafe(table, xmlCopyEntity, xmlFreeEntityWrapper);
    return(copy);
}
#ifdef LIBXML_OUTPUT_ENABLED
2001-02-23 20:55:21 +03:00
/**
 * xmlDumpEntityDecl:
 * @buf:  An XML buffer.
 * @ent:  An entity
 *
 * This will dump the entity as an XML DTD definition into the buffer.
 * If saving fails, the content of the buffer is detached and freed.
 * Does nothing if @buf or @ent is NULL.
 */
void
xmlDumpEntityDecl(xmlBufferPtr buf, xmlEntityPtr ent) {
    xmlSaveCtxtPtr save;
    int status;

    if ((buf == NULL) || (ent == NULL))
        return;

    save = xmlSaveToBuffer(buf, NULL, 0);
    xmlSaveTree(save, (xmlNodePtr) ent);

    status = xmlSaveFinish(save);
    if (status != XML_ERR_OK)
        xmlFree(xmlBufferDetach(buf));
}
/**
 * xmlDumpEntityDeclScan:
 * @ent:  An entity
 * @save:  the save context
 * @name:  the hash table key, unused
 *
 * Hash table scan callback saving one entity. The scanner passes the
 * payload first and the user data second, so the arguments are swapped
 * when calling xmlSaveTree.
 */
static void
xmlDumpEntityDeclScan(void *ent, void *save,
                      const xmlChar *name ATTRIBUTE_UNUSED) {
    xmlSaveTree((xmlSaveCtxtPtr) save, (xmlNodePtr) ent);
}
2001-02-23 20:55:21 +03:00
/**
 * xmlDumpEntitiesTable:
 * @buf:  An XML buffer.
 * @table:  An entity table
 *
 * This will dump the content of the entity table as an XML DTD
 * definition into the buffer. If saving fails, the content of the
 * buffer is detached and freed. Does nothing if @buf or @table is NULL.
 */
void
xmlDumpEntitiesTable(xmlBufferPtr buf, xmlEntitiesTablePtr table) {
    xmlSaveCtxtPtr save;
    int status;

    if ((buf == NULL) || (table == NULL))
        return;

    save = xmlSaveToBuffer(buf, NULL, 0);
    xmlHashScan(table, xmlDumpEntityDeclScan, save);

    status = xmlSaveFinish(save);
    if (status != XML_ERR_OK)
        xmlFree(xmlBufferDetach(buf));
}
#endif /* LIBXML_OUTPUT_ENABLED */