mirror of
https://gitlab.gnome.org/GNOME/libxml2.git
synced 2024-12-25 23:21:26 +03:00
7f3f3f115f
This fixes quadratic behavior with large dictionaries. Also rework testdict.c to support tests with larger dictionaries.
1268 lines
30 KiB
C
1268 lines
30 KiB
C
/*
|
|
* dict.c: dictionary of reusable strings, just used to avoid allocation
|
|
* and freeing operations.
|
|
*
|
|
* Copyright (C) 2003-2012 Daniel Veillard.
|
|
*
|
|
* Permission to use, copy, modify, and distribute this software for any
|
|
* purpose with or without fee is hereby granted, provided that the above
|
|
* copyright notice and this permission notice appear in all copies.
|
|
*
|
|
* THIS SOFTWARE IS PROVIDED ``AS IS'' AND WITHOUT ANY EXPRESS OR IMPLIED
|
|
* WARRANTIES, INCLUDING, WITHOUT LIMITATION, THE IMPLIED WARRANTIES OF
|
|
* MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE. THE AUTHORS AND
|
|
* CONTRIBUTORS ACCEPT NO RESPONSIBILITY IN ANY CONCEIVABLE MANNER.
|
|
*
|
|
* Author: daniel@veillard.com
|
|
*/
|
|
|
|
#define IN_LIBXML
|
|
#include "libxml.h"
|
|
|
|
#include <limits.h>
|
|
#include <stdlib.h>
|
|
#include <time.h>
|
|
|
|
#include "private/dict.h"
|
|
#include "private/threads.h"
|
|
|
|
/*
|
|
* Following http://www.ocert.org/advisories/ocert-2011-003.html
|
|
* it seems that having hash randomization might be a good idea
|
|
* when using XML with untrusted data
|
|
* Note1: that it works correctly only if compiled with WITH_BIG_KEY
|
|
* which is the default.
|
|
* Note2: the fast function used for a small dict won't protect very
|
|
* well but since the attack is based on growing a very big hash
|
|
* list we will use the BigKey algo as soon as the hash size grows
|
|
* over MIN_DICT_SIZE so this actually works
|
|
*/
|
|
#if !defined(FUZZING_BUILD_MODE_UNSAFE_FOR_PRODUCTION)
|
|
#define DICT_RANDOMIZATION
|
|
#endif
|
|
|
|
#include <string.h>
|
|
#ifdef HAVE_STDINT_H
|
|
#include <stdint.h>
|
|
#else
|
|
#ifdef HAVE_INTTYPES_H
|
|
#include <inttypes.h>
|
|
#elif defined(_WIN32)
|
|
typedef unsigned __int32 uint32_t;
|
|
#endif
|
|
#endif
|
|
#include <libxml/tree.h>
|
|
#include <libxml/dict.h>
|
|
#include <libxml/xmlmemory.h>
|
|
#include <libxml/xmlerror.h>
|
|
#include <libxml/globals.h>
|
|
|
|
/* #define DEBUG_GROW */
|
|
/* #define DICT_DEBUG_PATTERNS */
|
|
|
|
#define MAX_HASH_LEN 3
|
|
#define MIN_DICT_SIZE 128
|
|
#define MAX_DICT_HASH 100000000
|
|
#define WITH_BIG_KEY
|
|
|
|
#ifdef WITH_BIG_KEY
|
|
#define xmlDictComputeKey(dict, name, len) \
|
|
(((dict)->size == MIN_DICT_SIZE) ? \
|
|
xmlDictComputeFastKey(name, len, (dict)->seed) : \
|
|
xmlDictComputeBigKey(name, len, (dict)->seed))
|
|
|
|
#define xmlDictComputeQKey(dict, prefix, plen, name, len) \
|
|
(((prefix) == NULL) ? \
|
|
(xmlDictComputeKey(dict, name, len)) : \
|
|
(((dict)->size == MIN_DICT_SIZE) ? \
|
|
xmlDictComputeFastQKey(prefix, plen, name, len, (dict)->seed) : \
|
|
xmlDictComputeBigQKey(prefix, plen, name, len, (dict)->seed)))
|
|
|
|
#else /* !WITH_BIG_KEY */
|
|
#define xmlDictComputeKey(dict, name, len) \
|
|
xmlDictComputeFastKey(name, len, (dict)->seed)
|
|
#define xmlDictComputeQKey(dict, prefix, plen, name, len) \
|
|
xmlDictComputeFastQKey(prefix, plen, name, len, (dict)->seed)
|
|
#endif /* WITH_BIG_KEY */
|
|
|
|
/*
|
|
* An entry in the dictionary
|
|
*/
|
|
typedef struct _xmlDictEntry xmlDictEntry;
|
|
typedef xmlDictEntry *xmlDictEntryPtr;
|
|
struct _xmlDictEntry {
|
|
struct _xmlDictEntry *next;
|
|
const xmlChar *name;
|
|
unsigned int len;
|
|
int valid;
|
|
unsigned long okey;
|
|
};
|
|
|
|
typedef struct _xmlDictStrings xmlDictStrings;
|
|
typedef xmlDictStrings *xmlDictStringsPtr;
|
|
struct _xmlDictStrings {
|
|
xmlDictStringsPtr next;
|
|
xmlChar *free;
|
|
xmlChar *end;
|
|
size_t size;
|
|
size_t nbStrings;
|
|
xmlChar array[1];
|
|
};
|
|
/*
|
|
* The entire dictionary
|
|
*/
|
|
struct _xmlDict {
|
|
int ref_counter;
|
|
|
|
struct _xmlDictEntry *dict;
|
|
size_t size;
|
|
unsigned int nbElems;
|
|
xmlDictStringsPtr strings;
|
|
|
|
struct _xmlDict *subdict;
|
|
/* used for randomization */
|
|
int seed;
|
|
/* used to impose a limit on size */
|
|
size_t limit;
|
|
};
|
|
|
|
/*
|
|
* A mutex for modifying the reference counter for shared
|
|
* dictionaries.
|
|
*/
|
|
static xmlMutex xmlDictMutex;
|
|
|
|
#ifdef DICT_RANDOMIZATION
|
|
#ifdef HAVE_RAND_R
|
|
/*
|
|
* Internal data for random function, protected by xmlDictMutex
|
|
*/
|
|
static unsigned int rand_seed = 0;
|
|
#endif
|
|
#endif
|
|
|
|
/**
|
|
* xmlInitializeDict:
|
|
*
|
|
* DEPRECATED: Alias for xmlInitParser.
|
|
*/
|
|
int xmlInitializeDict(void) {
|
|
xmlInitParser();
|
|
return(0);
|
|
}
|
|
|
|
/**
|
|
* __xmlInitializeDict:
|
|
*
|
|
* This function is not public
|
|
* Do the dictionary mutex initialization.
|
|
*/
|
|
int __xmlInitializeDict(void) {
|
|
xmlInitMutex(&xmlDictMutex);
|
|
|
|
#ifdef DICT_RANDOMIZATION
|
|
#ifdef HAVE_RAND_R
|
|
rand_seed = time(NULL);
|
|
rand_r(& rand_seed);
|
|
#else
|
|
srand(time(NULL));
|
|
#endif
|
|
#endif
|
|
return(1);
|
|
}
|
|
|
|
#ifdef DICT_RANDOMIZATION
|
|
int __xmlRandom(void) {
|
|
int ret;
|
|
|
|
xmlMutexLock(&xmlDictMutex);
|
|
#ifdef HAVE_RAND_R
|
|
ret = rand_r(& rand_seed);
|
|
#else
|
|
ret = rand();
|
|
#endif
|
|
xmlMutexUnlock(&xmlDictMutex);
|
|
return(ret);
|
|
}
|
|
#endif
|
|
|
|
/**
|
|
* xmlDictCleanup:
|
|
*
|
|
* DEPRECATED: This function is a no-op. Call xmlCleanupParser
|
|
* to free global state but see the warnings there. xmlCleanupParser
|
|
* should be only called once at program exit. In most cases, you don't
|
|
* have call cleanup functions at all.
|
|
*/
|
|
void
|
|
xmlDictCleanup(void) {
|
|
}
|
|
|
|
/**
|
|
* xmlCleanupDictInternal:
|
|
*
|
|
* Free the dictionary mutex.
|
|
*/
|
|
void
|
|
xmlCleanupDictInternal(void) {
|
|
xmlCleanupMutex(&xmlDictMutex);
|
|
}
|
|
|
|
/*
|
|
* xmlDictAddString:
|
|
* @dict: the dictionary
|
|
* @name: the name of the userdata
|
|
* @len: the length of the name
|
|
*
|
|
* Add the string to the array[s]
|
|
*
|
|
* Returns the pointer of the local string, or NULL in case of error.
|
|
*/
|
|
static const xmlChar *
|
|
xmlDictAddString(xmlDictPtr dict, const xmlChar *name, unsigned int namelen) {
|
|
xmlDictStringsPtr pool;
|
|
const xmlChar *ret;
|
|
size_t size = 0; /* + sizeof(_xmlDictStrings) == 1024 */
|
|
size_t limit = 0;
|
|
|
|
#ifdef DICT_DEBUG_PATTERNS
|
|
fprintf(stderr, "-");
|
|
#endif
|
|
pool = dict->strings;
|
|
while (pool != NULL) {
|
|
if ((size_t)(pool->end - pool->free) > namelen)
|
|
goto found_pool;
|
|
if (pool->size > size) size = pool->size;
|
|
limit += pool->size;
|
|
pool = pool->next;
|
|
}
|
|
/*
|
|
* Not found, need to allocate
|
|
*/
|
|
if (pool == NULL) {
|
|
if ((dict->limit > 0) && (limit > dict->limit)) {
|
|
return(NULL);
|
|
}
|
|
|
|
if (size == 0) size = 1000;
|
|
else size *= 4; /* exponential growth */
|
|
if (size < 4 * namelen)
|
|
size = 4 * namelen; /* just in case ! */
|
|
pool = (xmlDictStringsPtr) xmlMalloc(sizeof(xmlDictStrings) + size);
|
|
if (pool == NULL)
|
|
return(NULL);
|
|
pool->size = size;
|
|
pool->nbStrings = 0;
|
|
pool->free = &pool->array[0];
|
|
pool->end = &pool->array[size];
|
|
pool->next = dict->strings;
|
|
dict->strings = pool;
|
|
#ifdef DICT_DEBUG_PATTERNS
|
|
fprintf(stderr, "+");
|
|
#endif
|
|
}
|
|
found_pool:
|
|
ret = pool->free;
|
|
memcpy(pool->free, name, namelen);
|
|
pool->free += namelen;
|
|
*(pool->free++) = 0;
|
|
pool->nbStrings++;
|
|
return(ret);
|
|
}
|
|
|
|
/*
|
|
* xmlDictAddQString:
|
|
* @dict: the dictionary
|
|
* @prefix: the prefix of the userdata
|
|
* @plen: the prefix length
|
|
* @name: the name of the userdata
|
|
* @len: the length of the name
|
|
*
|
|
* Add the QName to the array[s]
|
|
*
|
|
* Returns the pointer of the local string, or NULL in case of error.
|
|
*/
|
|
static const xmlChar *
|
|
xmlDictAddQString(xmlDictPtr dict, const xmlChar *prefix, unsigned int plen,
|
|
const xmlChar *name, unsigned int namelen)
|
|
{
|
|
xmlDictStringsPtr pool;
|
|
const xmlChar *ret;
|
|
size_t size = 0; /* + sizeof(_xmlDictStrings) == 1024 */
|
|
size_t limit = 0;
|
|
|
|
if (prefix == NULL) return(xmlDictAddString(dict, name, namelen));
|
|
|
|
#ifdef DICT_DEBUG_PATTERNS
|
|
fprintf(stderr, "=");
|
|
#endif
|
|
pool = dict->strings;
|
|
while (pool != NULL) {
|
|
if ((size_t)(pool->end - pool->free) > namelen + plen + 1)
|
|
goto found_pool;
|
|
if (pool->size > size) size = pool->size;
|
|
limit += pool->size;
|
|
pool = pool->next;
|
|
}
|
|
/*
|
|
* Not found, need to allocate
|
|
*/
|
|
if (pool == NULL) {
|
|
if ((dict->limit > 0) && (limit > dict->limit)) {
|
|
return(NULL);
|
|
}
|
|
|
|
if (size == 0) size = 1000;
|
|
else size *= 4; /* exponential growth */
|
|
if (size < 4 * (namelen + plen + 1))
|
|
size = 4 * (namelen + plen + 1); /* just in case ! */
|
|
pool = (xmlDictStringsPtr) xmlMalloc(sizeof(xmlDictStrings) + size);
|
|
if (pool == NULL)
|
|
return(NULL);
|
|
pool->size = size;
|
|
pool->nbStrings = 0;
|
|
pool->free = &pool->array[0];
|
|
pool->end = &pool->array[size];
|
|
pool->next = dict->strings;
|
|
dict->strings = pool;
|
|
#ifdef DICT_DEBUG_PATTERNS
|
|
fprintf(stderr, "+");
|
|
#endif
|
|
}
|
|
found_pool:
|
|
ret = pool->free;
|
|
memcpy(pool->free, prefix, plen);
|
|
pool->free += plen;
|
|
*(pool->free++) = ':';
|
|
memcpy(pool->free, name, namelen);
|
|
pool->free += namelen;
|
|
*(pool->free++) = 0;
|
|
pool->nbStrings++;
|
|
return(ret);
|
|
}
|
|
|
|
#ifdef WITH_BIG_KEY
|
|
/*
|
|
* xmlDictComputeBigKey:
|
|
*
|
|
* Calculate a hash key using a good hash function that works well for
|
|
* larger hash table sizes.
|
|
*
|
|
* Hash function by "One-at-a-Time Hash" see
|
|
* http://burtleburtle.net/bob/hash/doobs.html
|
|
*/
|
|
|
|
#ifdef __clang__
|
|
ATTRIBUTE_NO_SANITIZE("unsigned-integer-overflow")
|
|
ATTRIBUTE_NO_SANITIZE("unsigned-shift-base")
|
|
#endif
|
|
static uint32_t
|
|
xmlDictComputeBigKey(const xmlChar* data, int namelen, int seed) {
|
|
uint32_t hash;
|
|
int i;
|
|
|
|
if (namelen <= 0 || data == NULL) return(0);
|
|
|
|
hash = seed;
|
|
|
|
for (i = 0;i < namelen; i++) {
|
|
hash += data[i];
|
|
hash += (hash << 10);
|
|
hash ^= (hash >> 6);
|
|
}
|
|
hash += (hash << 3);
|
|
hash ^= (hash >> 11);
|
|
hash += (hash << 15);
|
|
|
|
return hash;
|
|
}
|
|
|
|
/*
|
|
* xmlDictComputeBigQKey:
|
|
*
|
|
* Calculate a hash key for two strings using a good hash function
|
|
* that works well for larger hash table sizes.
|
|
*
|
|
* Hash function by "One-at-a-Time Hash" see
|
|
* http://burtleburtle.net/bob/hash/doobs.html
|
|
*
|
|
* Neither of the two strings must be NULL.
|
|
*/
|
|
#ifdef __clang__
|
|
ATTRIBUTE_NO_SANITIZE("unsigned-integer-overflow")
|
|
ATTRIBUTE_NO_SANITIZE("unsigned-shift-base")
|
|
#endif
|
|
static unsigned long
|
|
xmlDictComputeBigQKey(const xmlChar *prefix, int plen,
|
|
const xmlChar *name, int len, int seed)
|
|
{
|
|
uint32_t hash;
|
|
int i;
|
|
|
|
hash = seed;
|
|
|
|
for (i = 0;i < plen; i++) {
|
|
hash += prefix[i];
|
|
hash += (hash << 10);
|
|
hash ^= (hash >> 6);
|
|
}
|
|
hash += ':';
|
|
hash += (hash << 10);
|
|
hash ^= (hash >> 6);
|
|
|
|
for (i = 0;i < len; i++) {
|
|
hash += name[i];
|
|
hash += (hash << 10);
|
|
hash ^= (hash >> 6);
|
|
}
|
|
hash += (hash << 3);
|
|
hash ^= (hash >> 11);
|
|
hash += (hash << 15);
|
|
|
|
return hash;
|
|
}
|
|
#endif /* WITH_BIG_KEY */
|
|
|
|
/*
|
|
* xmlDictComputeFastKey:
|
|
*
|
|
* Calculate a hash key using a fast hash function that works well
|
|
* for low hash table fill.
|
|
*/
|
|
static unsigned long
|
|
xmlDictComputeFastKey(const xmlChar *name, int namelen, int seed) {
|
|
unsigned long value = seed;
|
|
|
|
if ((name == NULL) || (namelen <= 0))
|
|
return(value);
|
|
value += *name;
|
|
value <<= 5;
|
|
if (namelen > 10) {
|
|
value += name[namelen - 1];
|
|
namelen = 10;
|
|
}
|
|
switch (namelen) {
|
|
case 10: value += name[9];
|
|
/* Falls through. */
|
|
case 9: value += name[8];
|
|
/* Falls through. */
|
|
case 8: value += name[7];
|
|
/* Falls through. */
|
|
case 7: value += name[6];
|
|
/* Falls through. */
|
|
case 6: value += name[5];
|
|
/* Falls through. */
|
|
case 5: value += name[4];
|
|
/* Falls through. */
|
|
case 4: value += name[3];
|
|
/* Falls through. */
|
|
case 3: value += name[2];
|
|
/* Falls through. */
|
|
case 2: value += name[1];
|
|
/* Falls through. */
|
|
default: break;
|
|
}
|
|
return(value);
|
|
}
|
|
|
|
/*
|
|
* xmlDictComputeFastQKey:
|
|
*
|
|
* Calculate a hash key for two strings using a fast hash function
|
|
* that works well for low hash table fill.
|
|
*
|
|
* Neither of the two strings must be NULL.
|
|
*/
|
|
static unsigned long
|
|
xmlDictComputeFastQKey(const xmlChar *prefix, int plen,
|
|
const xmlChar *name, int len, int seed)
|
|
{
|
|
unsigned long value = seed;
|
|
|
|
if (plen == 0)
|
|
value += 30 * ':';
|
|
else
|
|
value += 30 * (*prefix);
|
|
|
|
if (len > 10) {
|
|
int offset = len - (plen + 1 + 1);
|
|
if (offset < 0)
|
|
offset = len - (10 + 1);
|
|
value += name[offset];
|
|
len = 10;
|
|
if (plen > 10)
|
|
plen = 10;
|
|
}
|
|
switch (plen) {
|
|
case 10: value += prefix[9];
|
|
/* Falls through. */
|
|
case 9: value += prefix[8];
|
|
/* Falls through. */
|
|
case 8: value += prefix[7];
|
|
/* Falls through. */
|
|
case 7: value += prefix[6];
|
|
/* Falls through. */
|
|
case 6: value += prefix[5];
|
|
/* Falls through. */
|
|
case 5: value += prefix[4];
|
|
/* Falls through. */
|
|
case 4: value += prefix[3];
|
|
/* Falls through. */
|
|
case 3: value += prefix[2];
|
|
/* Falls through. */
|
|
case 2: value += prefix[1];
|
|
/* Falls through. */
|
|
case 1: value += prefix[0];
|
|
/* Falls through. */
|
|
default: break;
|
|
}
|
|
len -= plen;
|
|
if (len > 0) {
|
|
value += ':';
|
|
len--;
|
|
}
|
|
switch (len) {
|
|
case 10: value += name[9];
|
|
/* Falls through. */
|
|
case 9: value += name[8];
|
|
/* Falls through. */
|
|
case 8: value += name[7];
|
|
/* Falls through. */
|
|
case 7: value += name[6];
|
|
/* Falls through. */
|
|
case 6: value += name[5];
|
|
/* Falls through. */
|
|
case 5: value += name[4];
|
|
/* Falls through. */
|
|
case 4: value += name[3];
|
|
/* Falls through. */
|
|
case 3: value += name[2];
|
|
/* Falls through. */
|
|
case 2: value += name[1];
|
|
/* Falls through. */
|
|
case 1: value += name[0];
|
|
/* Falls through. */
|
|
default: break;
|
|
}
|
|
return(value);
|
|
}
|
|
|
|
/**
|
|
* xmlDictCreate:
|
|
*
|
|
* Create a new dictionary
|
|
*
|
|
* Returns the newly created dictionary, or NULL if an error occurred.
|
|
*/
|
|
xmlDictPtr
|
|
xmlDictCreate(void) {
|
|
xmlDictPtr dict;
|
|
|
|
xmlInitParser();
|
|
|
|
#ifdef DICT_DEBUG_PATTERNS
|
|
fprintf(stderr, "C");
|
|
#endif
|
|
|
|
dict = xmlMalloc(sizeof(xmlDict));
|
|
if (dict) {
|
|
dict->ref_counter = 1;
|
|
dict->limit = 0;
|
|
|
|
dict->size = MIN_DICT_SIZE;
|
|
dict->nbElems = 0;
|
|
dict->dict = xmlMalloc(MIN_DICT_SIZE * sizeof(xmlDictEntry));
|
|
dict->strings = NULL;
|
|
dict->subdict = NULL;
|
|
if (dict->dict) {
|
|
memset(dict->dict, 0, MIN_DICT_SIZE * sizeof(xmlDictEntry));
|
|
#ifdef DICT_RANDOMIZATION
|
|
dict->seed = __xmlRandom();
|
|
#else
|
|
dict->seed = 0;
|
|
#endif
|
|
return(dict);
|
|
}
|
|
xmlFree(dict);
|
|
}
|
|
return(NULL);
|
|
}
|
|
|
|
/**
|
|
* xmlDictCreateSub:
|
|
* @sub: an existing dictionary
|
|
*
|
|
* Create a new dictionary, inheriting strings from the read-only
|
|
* dictionary @sub. On lookup, strings are first searched in the
|
|
* new dictionary, then in @sub, and if not found are created in the
|
|
* new dictionary.
|
|
*
|
|
* Returns the newly created dictionary, or NULL if an error occurred.
|
|
*/
|
|
xmlDictPtr
|
|
xmlDictCreateSub(xmlDictPtr sub) {
|
|
xmlDictPtr dict = xmlDictCreate();
|
|
|
|
if ((dict != NULL) && (sub != NULL)) {
|
|
#ifdef DICT_DEBUG_PATTERNS
|
|
fprintf(stderr, "R");
|
|
#endif
|
|
dict->seed = sub->seed;
|
|
dict->subdict = sub;
|
|
xmlDictReference(dict->subdict);
|
|
}
|
|
return(dict);
|
|
}
|
|
|
|
/**
|
|
* xmlDictReference:
|
|
* @dict: the dictionary
|
|
*
|
|
* Increment the reference counter of a dictionary
|
|
*
|
|
* Returns 0 in case of success and -1 in case of error
|
|
*/
|
|
int
|
|
xmlDictReference(xmlDictPtr dict) {
|
|
if (dict == NULL) return -1;
|
|
xmlMutexLock(&xmlDictMutex);
|
|
dict->ref_counter++;
|
|
xmlMutexUnlock(&xmlDictMutex);
|
|
return(0);
|
|
}
|
|
|
|
/**
|
|
* xmlDictGrow:
|
|
* @dict: the dictionary
|
|
* @size: the new size of the dictionary
|
|
*
|
|
* resize the dictionary
|
|
*
|
|
* Returns 0 in case of success, -1 in case of failure
|
|
*/
|
|
static int
|
|
xmlDictGrow(xmlDictPtr dict, size_t size) {
|
|
unsigned long key, okey;
|
|
size_t oldsize, i;
|
|
xmlDictEntryPtr iter, next;
|
|
struct _xmlDictEntry *olddict;
|
|
#ifdef DEBUG_GROW
|
|
unsigned long nbElem = 0;
|
|
#endif
|
|
int ret = 0;
|
|
int keep_keys = 1;
|
|
|
|
if (dict == NULL)
|
|
return(-1);
|
|
if (size < 8)
|
|
return(-1);
|
|
if (size > MAX_DICT_HASH)
|
|
return(-1);
|
|
|
|
#ifdef DICT_DEBUG_PATTERNS
|
|
fprintf(stderr, "*");
|
|
#endif
|
|
|
|
oldsize = dict->size;
|
|
olddict = dict->dict;
|
|
if (olddict == NULL)
|
|
return(-1);
|
|
if (oldsize == MIN_DICT_SIZE)
|
|
keep_keys = 0;
|
|
|
|
dict->dict = xmlMalloc(size * sizeof(xmlDictEntry));
|
|
if (dict->dict == NULL) {
|
|
dict->dict = olddict;
|
|
return(-1);
|
|
}
|
|
memset(dict->dict, 0, size * sizeof(xmlDictEntry));
|
|
dict->size = size;
|
|
|
|
/* If the two loops are merged, there would be situations where
|
|
a new entry needs to allocated and data copied into it from
|
|
the main dict. It is nicer to run through the array twice, first
|
|
copying all the elements in the main array (less probability of
|
|
allocate) and then the rest, so we only free in the second loop.
|
|
*/
|
|
for (i = 0; i < oldsize; i++) {
|
|
if (olddict[i].valid == 0)
|
|
continue;
|
|
|
|
if (keep_keys)
|
|
okey = olddict[i].okey;
|
|
else
|
|
okey = xmlDictComputeKey(dict, olddict[i].name, olddict[i].len);
|
|
key = okey % dict->size;
|
|
|
|
if (dict->dict[key].valid == 0) {
|
|
memcpy(&(dict->dict[key]), &(olddict[i]), sizeof(xmlDictEntry));
|
|
dict->dict[key].next = NULL;
|
|
dict->dict[key].okey = okey;
|
|
} else {
|
|
xmlDictEntryPtr entry;
|
|
|
|
entry = xmlMalloc(sizeof(xmlDictEntry));
|
|
if (entry != NULL) {
|
|
entry->name = olddict[i].name;
|
|
entry->len = olddict[i].len;
|
|
entry->okey = okey;
|
|
entry->next = dict->dict[key].next;
|
|
entry->valid = 1;
|
|
dict->dict[key].next = entry;
|
|
} else {
|
|
/*
|
|
* we don't have much ways to alert from here
|
|
* result is losing an entry and unicity guarantee
|
|
*/
|
|
ret = -1;
|
|
}
|
|
}
|
|
#ifdef DEBUG_GROW
|
|
nbElem++;
|
|
#endif
|
|
}
|
|
|
|
for (i = 0; i < oldsize; i++) {
|
|
iter = olddict[i].next;
|
|
while (iter) {
|
|
next = iter->next;
|
|
|
|
/*
|
|
* put back the entry in the new dict
|
|
*/
|
|
|
|
if (keep_keys)
|
|
okey = iter->okey;
|
|
else
|
|
okey = xmlDictComputeKey(dict, iter->name, iter->len);
|
|
key = okey % dict->size;
|
|
if (dict->dict[key].valid == 0) {
|
|
memcpy(&(dict->dict[key]), iter, sizeof(xmlDictEntry));
|
|
dict->dict[key].next = NULL;
|
|
dict->dict[key].valid = 1;
|
|
dict->dict[key].okey = okey;
|
|
xmlFree(iter);
|
|
} else {
|
|
iter->next = dict->dict[key].next;
|
|
iter->okey = okey;
|
|
dict->dict[key].next = iter;
|
|
}
|
|
|
|
#ifdef DEBUG_GROW
|
|
nbElem++;
|
|
#endif
|
|
|
|
iter = next;
|
|
}
|
|
}
|
|
|
|
xmlFree(olddict);
|
|
|
|
#ifdef DEBUG_GROW
|
|
xmlGenericError(xmlGenericErrorContext,
|
|
"xmlDictGrow : from %lu to %lu, %u elems\n", oldsize, size, nbElem);
|
|
#endif
|
|
|
|
return(ret);
|
|
}
|
|
|
|
/**
|
|
* xmlDictFree:
|
|
* @dict: the dictionary
|
|
*
|
|
* Free the hash @dict and its contents. The userdata is
|
|
* deallocated with @f if provided.
|
|
*/
|
|
void
|
|
xmlDictFree(xmlDictPtr dict) {
|
|
size_t i;
|
|
xmlDictEntryPtr iter;
|
|
xmlDictEntryPtr next;
|
|
int inside_dict = 0;
|
|
xmlDictStringsPtr pool, nextp;
|
|
|
|
if (dict == NULL)
|
|
return;
|
|
|
|
/* decrement the counter, it may be shared by a parser and docs */
|
|
xmlMutexLock(&xmlDictMutex);
|
|
dict->ref_counter--;
|
|
if (dict->ref_counter > 0) {
|
|
xmlMutexUnlock(&xmlDictMutex);
|
|
return;
|
|
}
|
|
|
|
xmlMutexUnlock(&xmlDictMutex);
|
|
|
|
if (dict->subdict != NULL) {
|
|
xmlDictFree(dict->subdict);
|
|
}
|
|
|
|
if (dict->dict) {
|
|
for(i = 0; ((i < dict->size) && (dict->nbElems > 0)); i++) {
|
|
iter = &(dict->dict[i]);
|
|
if (iter->valid == 0)
|
|
continue;
|
|
inside_dict = 1;
|
|
while (iter) {
|
|
next = iter->next;
|
|
if (!inside_dict)
|
|
xmlFree(iter);
|
|
dict->nbElems--;
|
|
inside_dict = 0;
|
|
iter = next;
|
|
}
|
|
}
|
|
xmlFree(dict->dict);
|
|
}
|
|
pool = dict->strings;
|
|
while (pool != NULL) {
|
|
nextp = pool->next;
|
|
xmlFree(pool);
|
|
pool = nextp;
|
|
}
|
|
xmlFree(dict);
|
|
}
|
|
|
|
/**
|
|
* xmlDictLookup:
|
|
* @dict: the dictionary
|
|
* @name: the name of the userdata
|
|
* @len: the length of the name, if -1 it is recomputed
|
|
*
|
|
* Add the @name to the dictionary @dict if not present.
|
|
*
|
|
* Returns the internal copy of the name or NULL in case of internal error
|
|
*/
|
|
const xmlChar *
|
|
xmlDictLookup(xmlDictPtr dict, const xmlChar *name, int len) {
|
|
unsigned long key, okey, nbi = 0;
|
|
xmlDictEntryPtr entry;
|
|
xmlDictEntryPtr insert;
|
|
const xmlChar *ret;
|
|
unsigned int l;
|
|
|
|
if ((dict == NULL) || (name == NULL))
|
|
return(NULL);
|
|
|
|
if (len < 0)
|
|
l = strlen((const char *) name);
|
|
else
|
|
l = len;
|
|
|
|
if (((dict->limit > 0) && (l >= dict->limit)) ||
|
|
(l > INT_MAX / 2))
|
|
return(NULL);
|
|
|
|
/*
|
|
* Check for duplicate and insertion location.
|
|
*/
|
|
okey = xmlDictComputeKey(dict, name, l);
|
|
key = okey % dict->size;
|
|
if (dict->dict[key].valid == 0) {
|
|
insert = NULL;
|
|
} else {
|
|
for (insert = &(dict->dict[key]); insert->next != NULL;
|
|
insert = insert->next) {
|
|
#ifdef __GNUC__
|
|
if ((insert->okey == okey) && (insert->len == l)) {
|
|
if (!memcmp(insert->name, name, l))
|
|
return(insert->name);
|
|
}
|
|
#else
|
|
if ((insert->okey == okey) && (insert->len == l) &&
|
|
(!xmlStrncmp(insert->name, name, l)))
|
|
return(insert->name);
|
|
#endif
|
|
nbi++;
|
|
}
|
|
#ifdef __GNUC__
|
|
if ((insert->okey == okey) && (insert->len == l)) {
|
|
if (!memcmp(insert->name, name, l))
|
|
return(insert->name);
|
|
}
|
|
#else
|
|
if ((insert->okey == okey) && (insert->len == l) &&
|
|
(!xmlStrncmp(insert->name, name, l)))
|
|
return(insert->name);
|
|
#endif
|
|
}
|
|
|
|
if (dict->subdict) {
|
|
unsigned long skey;
|
|
|
|
/* we cannot always reuse the same okey for the subdict */
|
|
if (((dict->size == MIN_DICT_SIZE) &&
|
|
(dict->subdict->size != MIN_DICT_SIZE)) ||
|
|
((dict->size != MIN_DICT_SIZE) &&
|
|
(dict->subdict->size == MIN_DICT_SIZE)))
|
|
skey = xmlDictComputeKey(dict->subdict, name, l);
|
|
else
|
|
skey = okey;
|
|
|
|
key = skey % dict->subdict->size;
|
|
if (dict->subdict->dict[key].valid != 0) {
|
|
xmlDictEntryPtr tmp;
|
|
|
|
for (tmp = &(dict->subdict->dict[key]); tmp->next != NULL;
|
|
tmp = tmp->next) {
|
|
#ifdef __GNUC__
|
|
if ((tmp->okey == skey) && (tmp->len == l)) {
|
|
if (!memcmp(tmp->name, name, l))
|
|
return(tmp->name);
|
|
}
|
|
#else
|
|
if ((tmp->okey == skey) && (tmp->len == l) &&
|
|
(!xmlStrncmp(tmp->name, name, l)))
|
|
return(tmp->name);
|
|
#endif
|
|
nbi++;
|
|
}
|
|
#ifdef __GNUC__
|
|
if ((tmp->okey == skey) && (tmp->len == l)) {
|
|
if (!memcmp(tmp->name, name, l))
|
|
return(tmp->name);
|
|
}
|
|
#else
|
|
if ((tmp->okey == skey) && (tmp->len == l) &&
|
|
(!xmlStrncmp(tmp->name, name, l)))
|
|
return(tmp->name);
|
|
#endif
|
|
}
|
|
key = okey % dict->size;
|
|
}
|
|
|
|
ret = xmlDictAddString(dict, name, l);
|
|
if (ret == NULL)
|
|
return(NULL);
|
|
if (insert == NULL) {
|
|
entry = &(dict->dict[key]);
|
|
} else {
|
|
entry = xmlMalloc(sizeof(xmlDictEntry));
|
|
if (entry == NULL)
|
|
return(NULL);
|
|
}
|
|
entry->name = ret;
|
|
entry->len = l;
|
|
entry->next = NULL;
|
|
entry->valid = 1;
|
|
entry->okey = okey;
|
|
|
|
|
|
if (insert != NULL)
|
|
insert->next = entry;
|
|
|
|
dict->nbElems++;
|
|
|
|
if ((nbi > MAX_HASH_LEN) &&
|
|
(dict->size <= ((MAX_DICT_HASH / 2) / MAX_HASH_LEN))) {
|
|
if (xmlDictGrow(dict, MAX_HASH_LEN * 2 * dict->size) != 0)
|
|
return(NULL);
|
|
}
|
|
/* Note that entry may have been freed at this point by xmlDictGrow */
|
|
|
|
return(ret);
|
|
}
|
|
|
|
/**
|
|
* xmlDictExists:
|
|
* @dict: the dictionary
|
|
* @name: the name of the userdata
|
|
* @len: the length of the name, if -1 it is recomputed
|
|
*
|
|
* Check if the @name exists in the dictionary @dict.
|
|
*
|
|
* Returns the internal copy of the name or NULL if not found.
|
|
*/
|
|
const xmlChar *
|
|
xmlDictExists(xmlDictPtr dict, const xmlChar *name, int len) {
|
|
unsigned long key, okey;
|
|
xmlDictEntryPtr insert;
|
|
unsigned int l;
|
|
|
|
if ((dict == NULL) || (name == NULL))
|
|
return(NULL);
|
|
|
|
if (len < 0)
|
|
l = strlen((const char *) name);
|
|
else
|
|
l = len;
|
|
if (((dict->limit > 0) && (l >= dict->limit)) ||
|
|
(l > INT_MAX / 2))
|
|
return(NULL);
|
|
|
|
/*
|
|
* Check for duplicate and insertion location.
|
|
*/
|
|
okey = xmlDictComputeKey(dict, name, l);
|
|
key = okey % dict->size;
|
|
if (dict->dict[key].valid == 0) {
|
|
insert = NULL;
|
|
} else {
|
|
for (insert = &(dict->dict[key]); insert->next != NULL;
|
|
insert = insert->next) {
|
|
#ifdef __GNUC__
|
|
if ((insert->okey == okey) && (insert->len == l)) {
|
|
if (!memcmp(insert->name, name, l))
|
|
return(insert->name);
|
|
}
|
|
#else
|
|
if ((insert->okey == okey) && (insert->len == l) &&
|
|
(!xmlStrncmp(insert->name, name, l)))
|
|
return(insert->name);
|
|
#endif
|
|
}
|
|
#ifdef __GNUC__
|
|
if ((insert->okey == okey) && (insert->len == l)) {
|
|
if (!memcmp(insert->name, name, l))
|
|
return(insert->name);
|
|
}
|
|
#else
|
|
if ((insert->okey == okey) && (insert->len == l) &&
|
|
(!xmlStrncmp(insert->name, name, l)))
|
|
return(insert->name);
|
|
#endif
|
|
}
|
|
|
|
if (dict->subdict) {
|
|
unsigned long skey;
|
|
|
|
/* we cannot always reuse the same okey for the subdict */
|
|
if (((dict->size == MIN_DICT_SIZE) &&
|
|
(dict->subdict->size != MIN_DICT_SIZE)) ||
|
|
((dict->size != MIN_DICT_SIZE) &&
|
|
(dict->subdict->size == MIN_DICT_SIZE)))
|
|
skey = xmlDictComputeKey(dict->subdict, name, l);
|
|
else
|
|
skey = okey;
|
|
|
|
key = skey % dict->subdict->size;
|
|
if (dict->subdict->dict[key].valid != 0) {
|
|
xmlDictEntryPtr tmp;
|
|
|
|
for (tmp = &(dict->subdict->dict[key]); tmp->next != NULL;
|
|
tmp = tmp->next) {
|
|
#ifdef __GNUC__
|
|
if ((tmp->okey == skey) && (tmp->len == l)) {
|
|
if (!memcmp(tmp->name, name, l))
|
|
return(tmp->name);
|
|
}
|
|
#else
|
|
if ((tmp->okey == skey) && (tmp->len == l) &&
|
|
(!xmlStrncmp(tmp->name, name, l)))
|
|
return(tmp->name);
|
|
#endif
|
|
}
|
|
#ifdef __GNUC__
|
|
if ((tmp->okey == skey) && (tmp->len == l)) {
|
|
if (!memcmp(tmp->name, name, l))
|
|
return(tmp->name);
|
|
}
|
|
#else
|
|
if ((tmp->okey == skey) && (tmp->len == l) &&
|
|
(!xmlStrncmp(tmp->name, name, l)))
|
|
return(tmp->name);
|
|
#endif
|
|
}
|
|
}
|
|
|
|
/* not found */
|
|
return(NULL);
|
|
}
|
|
|
|
/**
|
|
* xmlDictQLookup:
|
|
* @dict: the dictionary
|
|
* @prefix: the prefix
|
|
* @name: the name
|
|
*
|
|
* Add the QName @prefix:@name to the hash @dict if not present.
|
|
*
|
|
* Returns the internal copy of the QName or NULL in case of internal error
|
|
*/
|
|
const xmlChar *
|
|
xmlDictQLookup(xmlDictPtr dict, const xmlChar *prefix, const xmlChar *name) {
|
|
unsigned long okey, key, nbi = 0;
|
|
xmlDictEntryPtr entry;
|
|
xmlDictEntryPtr insert;
|
|
const xmlChar *ret;
|
|
unsigned int len, plen, l;
|
|
|
|
if ((dict == NULL) || (name == NULL))
|
|
return(NULL);
|
|
if (prefix == NULL)
|
|
return(xmlDictLookup(dict, name, -1));
|
|
|
|
l = len = strlen((const char *) name);
|
|
plen = strlen((const char *) prefix);
|
|
len += 1 + plen;
|
|
|
|
/*
|
|
* Check for duplicate and insertion location.
|
|
*/
|
|
okey = xmlDictComputeQKey(dict, prefix, plen, name, l);
|
|
key = okey % dict->size;
|
|
if (dict->dict[key].valid == 0) {
|
|
insert = NULL;
|
|
} else {
|
|
for (insert = &(dict->dict[key]); insert->next != NULL;
|
|
insert = insert->next) {
|
|
if ((insert->okey == okey) && (insert->len == len) &&
|
|
(xmlStrQEqual(prefix, name, insert->name)))
|
|
return(insert->name);
|
|
nbi++;
|
|
}
|
|
if ((insert->okey == okey) && (insert->len == len) &&
|
|
(xmlStrQEqual(prefix, name, insert->name)))
|
|
return(insert->name);
|
|
}
|
|
|
|
if (dict->subdict) {
|
|
unsigned long skey;
|
|
|
|
/* we cannot always reuse the same okey for the subdict */
|
|
if (((dict->size == MIN_DICT_SIZE) &&
|
|
(dict->subdict->size != MIN_DICT_SIZE)) ||
|
|
((dict->size != MIN_DICT_SIZE) &&
|
|
(dict->subdict->size == MIN_DICT_SIZE)))
|
|
skey = xmlDictComputeQKey(dict->subdict, prefix, plen, name, l);
|
|
else
|
|
skey = okey;
|
|
|
|
key = skey % dict->subdict->size;
|
|
if (dict->subdict->dict[key].valid != 0) {
|
|
xmlDictEntryPtr tmp;
|
|
for (tmp = &(dict->subdict->dict[key]); tmp->next != NULL;
|
|
tmp = tmp->next) {
|
|
if ((tmp->okey == skey) && (tmp->len == len) &&
|
|
(xmlStrQEqual(prefix, name, tmp->name)))
|
|
return(tmp->name);
|
|
nbi++;
|
|
}
|
|
if ((tmp->okey == skey) && (tmp->len == len) &&
|
|
(xmlStrQEqual(prefix, name, tmp->name)))
|
|
return(tmp->name);
|
|
}
|
|
key = okey % dict->size;
|
|
}
|
|
|
|
ret = xmlDictAddQString(dict, prefix, plen, name, l);
|
|
if (ret == NULL)
|
|
return(NULL);
|
|
if (insert == NULL) {
|
|
entry = &(dict->dict[key]);
|
|
} else {
|
|
entry = xmlMalloc(sizeof(xmlDictEntry));
|
|
if (entry == NULL)
|
|
return(NULL);
|
|
}
|
|
entry->name = ret;
|
|
entry->len = len;
|
|
entry->next = NULL;
|
|
entry->valid = 1;
|
|
entry->okey = okey;
|
|
|
|
if (insert != NULL)
|
|
insert->next = entry;
|
|
|
|
dict->nbElems++;
|
|
|
|
if ((nbi > MAX_HASH_LEN) &&
|
|
(dict->size <= ((MAX_DICT_HASH / 2) / MAX_HASH_LEN)))
|
|
xmlDictGrow(dict, MAX_HASH_LEN * 2 * dict->size);
|
|
/* Note that entry may have been freed at this point by xmlDictGrow */
|
|
|
|
return(ret);
|
|
}
|
|
|
|
/**
|
|
* xmlDictOwns:
|
|
* @dict: the dictionary
|
|
* @str: the string
|
|
*
|
|
* check if a string is owned by the dictionary
|
|
*
|
|
* Returns 1 if true, 0 if false and -1 in case of error
|
|
* -1 in case of error
|
|
*/
|
|
int
|
|
xmlDictOwns(xmlDictPtr dict, const xmlChar *str) {
|
|
xmlDictStringsPtr pool;
|
|
|
|
if ((dict == NULL) || (str == NULL))
|
|
return(-1);
|
|
pool = dict->strings;
|
|
while (pool != NULL) {
|
|
if ((str >= &pool->array[0]) && (str <= pool->free))
|
|
return(1);
|
|
pool = pool->next;
|
|
}
|
|
if (dict->subdict)
|
|
return(xmlDictOwns(dict->subdict, str));
|
|
return(0);
|
|
}
|
|
|
|
/**
|
|
* xmlDictSize:
|
|
* @dict: the dictionary
|
|
*
|
|
* Query the number of elements installed in the hash @dict.
|
|
*
|
|
* Returns the number of elements in the dictionary or
|
|
* -1 in case of error
|
|
*/
|
|
int
|
|
xmlDictSize(xmlDictPtr dict) {
|
|
if (dict == NULL)
|
|
return(-1);
|
|
if (dict->subdict)
|
|
return(dict->nbElems + dict->subdict->nbElems);
|
|
return(dict->nbElems);
|
|
}
|
|
|
|
/**
|
|
* xmlDictSetLimit:
|
|
* @dict: the dictionary
|
|
* @limit: the limit in bytes
|
|
*
|
|
* Set a size limit for the dictionary
|
|
* Added in 2.9.0
|
|
*
|
|
* Returns the previous limit of the dictionary or 0
|
|
*/
|
|
size_t
|
|
xmlDictSetLimit(xmlDictPtr dict, size_t limit) {
|
|
size_t ret;
|
|
|
|
if (dict == NULL)
|
|
return(0);
|
|
ret = dict->limit;
|
|
dict->limit = limit;
|
|
return(ret);
|
|
}
|
|
|
|
/**
|
|
* xmlDictGetUsage:
|
|
* @dict: the dictionary
|
|
*
|
|
* Get how much memory is used by a dictionary for strings
|
|
* Added in 2.9.0
|
|
*
|
|
* Returns the amount of strings allocated
|
|
*/
|
|
size_t
|
|
xmlDictGetUsage(xmlDictPtr dict) {
|
|
xmlDictStringsPtr pool;
|
|
size_t limit = 0;
|
|
|
|
if (dict == NULL)
|
|
return(0);
|
|
pool = dict->strings;
|
|
while (pool != NULL) {
|
|
limit += pool->size;
|
|
pool = pool->next;
|
|
}
|
|
return(limit);
|
|
}
|
|
|