dict.c - platform/external/libxml2 - Git at Google

 /*
  * dict.c: dictionary of reusable strings, just used to avoid allocation
  *         and freeing operations.
  *
  * Copyright (C) 2003-2012 Daniel Veillard.
  *
  * Permission to use, copy, modify, and distribute this software for any
  * purpose with or without fee is hereby granted, provided that the above
  * copyright notice and this permission notice appear in all copies.
  *
  * THIS SOFTWARE IS PROVIDED ``AS IS'' AND WITHOUT ANY EXPRESS OR IMPLIED
  * WARRANTIES, INCLUDING, WITHOUT LIMITATION, THE IMPLIED WARRANTIES OF
  * MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE. THE AUTHORS AND
  * CONTRIBUTORS ACCEPT NO RESPONSIBILITY IN ANY CONCEIVABLE MANNER.
  *
  * Author: daniel@veillard.com
  */

 #define IN_LIBXML
 #include "libxml.h"

 #include <limits.h>
 #include <string.h>
 #include <time.h>

 #include "private/dict.h"
 #include "private/threads.h"

 #include <libxml/tree.h>
 #include <libxml/dict.h>
 #include <libxml/xmlmemory.h>
 #include <libxml/xmlerror.h>
 #include <libxml/globals.h>

 /*
  * Following http://www.ocert.org/advisories/ocert-2011-003.html
  * it seems that having hash randomization might be a good idea
  * when using XML with untrusted data
  * Note1: that it works correctly only if compiled with WITH_BIG_KEY
  *  which is the default.
  * Note2: the fast function used for a small dict won't protect very
  *  well but since the attack is based on growing a very big hash
  *  list we will use the BigKey algo as soon as the hash size grows
  *  over MIN_DICT_SIZE so this actually works
  */
 #if !defined(FUZZING_BUILD_MODE_UNSAFE_FOR_PRODUCTION)
 #define DICT_RANDOMIZATION
 #endif

 /* #define DEBUG_GROW */
 /* #define DICT_DEBUG_PATTERNS */

 #define MAX_HASH_LEN 16
 #define MAX_FILL 2
 #define GROWTH_FACTOR 4
 #define MIN_DICT_SIZE 128
 #define WITH_BIG_KEY

 #ifdef WITH_BIG_KEY
 #define xmlDictComputeKey(dict, name, len)                              \
     (((dict)->size == MIN_DICT_SIZE) ?                                  \
      xmlDictComputeFastKey(name, len, (dict)->seed) :                   \
      xmlDictComputeBigKey(name, len, (dict)->seed))

 #define xmlDictComputeQKey(dict, prefix, plen, name, len)               \
     (((prefix) == NULL) ?                                               \
       (xmlDictComputeKey(dict, name, len)) :                             \
       (((dict)->size == MIN_DICT_SIZE) ?                                \
        xmlDictComputeFastQKey(prefix, plen, name, len, (dict)->seed) :	\
        xmlDictComputeBigQKey(prefix, plen, name, len, (dict)->seed)))

 #else /* !WITH_BIG_KEY */
 #define xmlDictComputeKey(dict, name, len)                              \
         xmlDictComputeFastKey(name, len, (dict)->seed)
 #define xmlDictComputeQKey(dict, prefix, plen, name, len)               \
         xmlDictComputeFastQKey(prefix, plen, name, len, (dict)->seed)
 #endif /* WITH_BIG_KEY */

 /*
  * An entry in the dictionary
  */
 typedef struct _xmlDictEntry xmlDictEntry;
 typedef xmlDictEntry *xmlDictEntryPtr;
 struct _xmlDictEntry {
     struct _xmlDictEntry *next;
     const xmlChar *name;
     unsigned int len;
     int valid;
     unsigned okey;
 };

 typedef struct _xmlDictStrings xmlDictStrings;
 typedef xmlDictStrings *xmlDictStringsPtr;
 struct _xmlDictStrings {
     xmlDictStringsPtr next;
     xmlChar *free;
     xmlChar *end;
     size_t size;
     size_t nbStrings;
     xmlChar array[1];
 };
 /*
  * The entire dictionary
  */
 struct _xmlDict {
     int ref_counter;

     struct _xmlDictEntry *dict;
     size_t size;
     unsigned int nbElems;
     xmlDictStringsPtr strings;

     struct _xmlDict *subdict;
     /* used for randomization */
     unsigned seed;
     /* used to impose a limit on size */
     size_t limit;
 };

 /*
  * A mutex for modifying the reference counter for shared
  * dictionaries.
  */
 static xmlMutex xmlDictMutex;

 /*
  * Internal data for random function, protected by xmlDictMutex
  */
 static unsigned globalRngState[2];

 #ifdef XML_THREAD_LOCAL
 XML_THREAD_LOCAL static int localRngInitialized = 0;
 XML_THREAD_LOCAL static unsigned localRngState[2];
 #endif

 /**
  * xmlInitializeDict:
  *
  * DEPRECATED: Alias for xmlInitParser.
  */
 int
 xmlInitializeDict(void) {
     xmlInitParser();
     return(0);
 }

 /**
  * xmlInitializeDict:
  *
  * Initialize mutex and global PRNG seed.
  */
 #ifdef __clang__
 ATTRIBUTE_NO_SANITIZE("unsigned-integer-overflow")
 ATTRIBUTE_NO_SANITIZE("unsigned-shift-base")
 #endif
 void
 xmlInitDictInternal(void) {
     int var;

     xmlInitMutex(&xmlDictMutex);

     /* TODO: Get seed values from system PRNG */

     globalRngState[0] = (unsigned) time(NULL) ^
                         HASH_ROL((unsigned) (size_t) &xmlInitializeDict, 8);
     globalRngState[1] = HASH_ROL((unsigned) (size_t) &xmlDictMutex, 16) ^
                         HASH_ROL((unsigned) (size_t) &var, 24);
 }

 #ifdef __clang__
 ATTRIBUTE_NO_SANITIZE("unsigned-integer-overflow")
 ATTRIBUTE_NO_SANITIZE("unsigned-shift-base")
 #endif
 static unsigned
 xoroshiro64ss(unsigned *s) {
     unsigned s0 = s[0];
     unsigned s1 = s[1];
     unsigned result = HASH_ROL(s0 * 0x9E3779BB, 5) * 5;

     s1 ^= s0;
     s[0] = HASH_ROL(s0, 26) ^ s1 ^ (s1 << 9);
     s[1] = HASH_ROL(s1, 13);

     return(result & 0xFFFFFFFF);
 }

 unsigned
 xmlRandom(void) {
 #ifdef XML_THREAD_LOCAL
     if (!localRngInitialized) {
         xmlMutexLock(&xmlDictMutex);
         localRngState[0] = xoroshiro64ss(globalRngState);
         localRngState[1] = xoroshiro64ss(globalRngState);
         localRngInitialized = 1;
         xmlMutexUnlock(&xmlDictMutex);
     }

     return(xoroshiro64ss(localRngState));
 #else
     unsigned ret;

     xmlMutexLock(&xmlDictMutex);
     ret = xoroshiro64ss(globalRngState);
     xmlMutexUnlock(&xmlDictMutex);

     return(ret);
 #endif
 }

 /**
  * xmlDictCleanup:
  *
  * DEPRECATED: This function is a no-op. Call xmlCleanupParser
  * to free global state but see the warnings there. xmlCleanupParser
  * should be only called once at program exit. In most cases, you don't
  * have call cleanup functions at all.
  */
 void
 xmlDictCleanup(void) {
 }

 /**
  * xmlCleanupDictInternal:
  *
  * Free the dictionary mutex.
  */
 void
 xmlCleanupDictInternal(void) {
     xmlCleanupMutex(&xmlDictMutex);
 }

 /*
  * xmlDictAddString:
  * @dict: the dictionary
  * @name: the name of the userdata
  * @len: the length of the name
  *
  * Add the string to the array[s]
  *
  * Returns the pointer of the local string, or NULL in case of error.
  */
 static const xmlChar *
 xmlDictAddString(xmlDictPtr dict, const xmlChar *name, unsigned int namelen) {
     xmlDictStringsPtr pool;
     const xmlChar *ret;
     size_t size = 0; /* + sizeof(_xmlDictStrings) == 1024 */
     size_t limit = 0;

 #ifdef DICT_DEBUG_PATTERNS
     fprintf(stderr, "-");
 #endif
     pool = dict->strings;
     while (pool != NULL) {
 	if ((size_t)(pool->end - pool->free) > namelen)
 	    goto found_pool;
 	if (pool->size > size) size = pool->size;
         limit += pool->size;
 	pool = pool->next;
     }
     /*
      * Not found, need to allocate
      */
     if (pool == NULL) {
         if ((dict->limit > 0) && (limit > dict->limit)) {
             return(NULL);
         }

         if (size == 0) size = 1000;
 	else size *= 4; /* exponential growth */
         if (size < 4 * namelen)
 	    size = 4 * namelen; /* just in case ! */
 	pool = (xmlDictStringsPtr) xmlMalloc(sizeof(xmlDictStrings) + size);
 	if (pool == NULL)
 	    return(NULL);
 	pool->size = size;
 	pool->nbStrings = 0;
 	pool->free = &pool->array[0];
 	pool->end = &pool->array[size];
 	pool->next = dict->strings;
 	dict->strings = pool;
 #ifdef DICT_DEBUG_PATTERNS
         fprintf(stderr, "+");
 #endif
     }
 found_pool:
     ret = pool->free;
     memcpy(pool->free, name, namelen);
     pool->free += namelen;
     *(pool->free++) = 0;
     pool->nbStrings++;
     return(ret);
 }

 /*
  * xmlDictAddQString:
  * @dict: the dictionary
  * @prefix: the prefix of the userdata
  * @plen: the prefix length
  * @name: the name of the userdata
  * @len: the length of the name
  *
  * Add the QName to the array[s]
  *
  * Returns the pointer of the local string, or NULL in case of error.
  */
 static const xmlChar *
 xmlDictAddQString(xmlDictPtr dict, const xmlChar *prefix, unsigned int plen,
                  const xmlChar *name, unsigned int namelen)
 {
     xmlDictStringsPtr pool;
     const xmlChar *ret;
     size_t size = 0; /* + sizeof(_xmlDictStrings) == 1024 */
     size_t limit = 0;

     if (prefix == NULL) return(xmlDictAddString(dict, name, namelen));

 #ifdef DICT_DEBUG_PATTERNS
     fprintf(stderr, "=");
 #endif
     pool = dict->strings;
     while (pool != NULL) {
 	if ((size_t)(pool->end - pool->free) > namelen + plen + 1)
 	    goto found_pool;
 	if (pool->size > size) size = pool->size;
         limit += pool->size;
 	pool = pool->next;
     }
     /*
      * Not found, need to allocate
      */
     if (pool == NULL) {
         if ((dict->limit > 0) && (limit > dict->limit)) {
             return(NULL);
         }

         if (size == 0) size = 1000;
 	else size *= 4; /* exponential growth */
         if (size < 4 * (namelen + plen + 1))
 	    size = 4 * (namelen + plen + 1); /* just in case ! */
 	pool = (xmlDictStringsPtr) xmlMalloc(sizeof(xmlDictStrings) + size);
 	if (pool == NULL)
 	    return(NULL);
 	pool->size = size;
 	pool->nbStrings = 0;
 	pool->free = &pool->array[0];
 	pool->end = &pool->array[size];
 	pool->next = dict->strings;
 	dict->strings = pool;
 #ifdef DICT_DEBUG_PATTERNS
         fprintf(stderr, "+");
 #endif
     }
 found_pool:
     ret = pool->free;
     memcpy(pool->free, prefix, plen);
     pool->free += plen;
     *(pool->free++) = ':';
     memcpy(pool->free, name, namelen);
     pool->free += namelen;
     *(pool->free++) = 0;
     pool->nbStrings++;
     return(ret);
 }

 #ifdef WITH_BIG_KEY
 /*
  * xmlDictComputeBigKey:
  *
  * Calculate a hash key using a good hash function that works well for
  * larger hash table sizes.
  */

 #ifdef __clang__
 ATTRIBUTE_NO_SANITIZE("unsigned-integer-overflow")
 ATTRIBUTE_NO_SANITIZE("unsigned-shift-base")
 #endif
 static unsigned
 xmlDictComputeBigKey(const xmlChar* data, int namelen, unsigned seed) {
     unsigned h1, h2;
     int i;

     if (namelen <= 0 || data == NULL) return(0);

     HASH_INIT(h1, h2, seed);

     for (i = 0; i < namelen; i++) {
         HASH_UPDATE(h1, h2, data[i]);
     }

     HASH_FINISH(h1, h2);

     return h2;
 }

 /*
  * xmlDictComputeBigQKey:
  *
  * Calculate a hash key for two strings using a good hash function
  * that works well for larger hash table sizes.
  *
  * Hash function by "One-at-a-Time Hash" see
  * http://burtleburtle.net/bob/hash/doobs.html
  *
  * Neither of the two strings must be NULL.
  */
 #ifdef __clang__
 ATTRIBUTE_NO_SANITIZE("unsigned-integer-overflow")
 ATTRIBUTE_NO_SANITIZE("unsigned-shift-base")
 #endif
 static unsigned
 xmlDictComputeBigQKey(const xmlChar *prefix, int plen,
                       const xmlChar *name, int len, unsigned seed)
 {
     unsigned h1, h2;
     int i;

     HASH_INIT(h1, h2, seed);

     for (i = 0; i < plen; i++) {
         HASH_UPDATE(h1, h2, prefix[i]);
     }
     HASH_UPDATE(h1, h2, ':');

     for (i = 0; i < len; i++) {
         HASH_UPDATE(h1, h2, name[i]);
     }

     HASH_FINISH(h1, h2);

     return h2;
 }
 #endif /* WITH_BIG_KEY */

 /*
  * xmlDictComputeFastKey:
  *
  * Calculate a hash key using a fast hash function that works well
  * for low hash table fill.
  */
 #ifdef __clang__
 ATTRIBUTE_NO_SANITIZE("unsigned-integer-overflow")
 ATTRIBUTE_NO_SANITIZE("unsigned-shift-base")
 #endif
 static unsigned
 xmlDictComputeFastKey(const xmlChar *name, int namelen, unsigned seed) {
     unsigned value = seed;

     if ((name == NULL) || (namelen <= 0))
         return(value);
     value += *name;
     value <<= 5;
     if (namelen > 10) {
         value += name[namelen - 1];
         namelen = 10;
     }
     switch (namelen) {
         case 10: value += name[9];
         /* Falls through. */
         case 9: value += name[8];
         /* Falls through. */
         case 8: value += name[7];
         /* Falls through. */
         case 7: value += name[6];
         /* Falls through. */
         case 6: value += name[5];
         /* Falls through. */
         case 5: value += name[4];
         /* Falls through. */
         case 4: value += name[3];
         /* Falls through. */
         case 3: value += name[2];
         /* Falls through. */
         case 2: value += name[1];
         /* Falls through. */
         default: break;
     }
     return(value);
 }

 /*
  * xmlDictComputeFastQKey:
  *
  * Calculate a hash key for two strings using a fast hash function
  * that works well for low hash table fill.
  *
  * Neither of the two strings must be NULL.
  */
 #ifdef __clang__
 ATTRIBUTE_NO_SANITIZE("unsigned-integer-overflow")
 ATTRIBUTE_NO_SANITIZE("unsigned-shift-base")
 #endif
 static unsigned
 xmlDictComputeFastQKey(const xmlChar *prefix, int plen,
                        const xmlChar *name, int len, unsigned seed)
 {
     unsigned value = seed;

     if (plen == 0)
 	value += 30 * ':';
     else
 	value += 30 * (*prefix);

     if (len > 10) {
         int offset = len - (plen + 1 + 1);
 	if (offset < 0)
 	    offset = len - (10 + 1);
 	value += name[offset];
         len = 10;
 	if (plen > 10)
 	    plen = 10;
     }
     switch (plen) {
         case 10: value += prefix[9];
         /* Falls through. */
         case 9: value += prefix[8];
         /* Falls through. */
         case 8: value += prefix[7];
         /* Falls through. */
         case 7: value += prefix[6];
         /* Falls through. */
         case 6: value += prefix[5];
         /* Falls through. */
         case 5: value += prefix[4];
         /* Falls through. */
         case 4: value += prefix[3];
         /* Falls through. */
         case 3: value += prefix[2];
         /* Falls through. */
         case 2: value += prefix[1];
         /* Falls through. */
         case 1: value += prefix[0];
         /* Falls through. */
         default: break;
     }
     len -= plen;
     if (len > 0) {
         value += ':';
 	len--;
     }
     switch (len) {
         case 10: value += name[9];
         /* Falls through. */
         case 9: value += name[8];
         /* Falls through. */
         case 8: value += name[7];
         /* Falls through. */
         case 7: value += name[6];
         /* Falls through. */
         case 6: value += name[5];
         /* Falls through. */
         case 5: value += name[4];
         /* Falls through. */
         case 4: value += name[3];
         /* Falls through. */
         case 3: value += name[2];
         /* Falls through. */
         case 2: value += name[1];
         /* Falls through. */
         case 1: value += name[0];
         /* Falls through. */
         default: break;
     }
     return(value);
 }

 /**
  * xmlDictCreate:
  *
  * Create a new dictionary
  *
  * Returns the newly created dictionary, or NULL if an error occurred.
  */
 xmlDictPtr
 xmlDictCreate(void) {
     xmlDictPtr dict;

     xmlInitParser();

 #ifdef DICT_DEBUG_PATTERNS
     fprintf(stderr, "C");
 #endif

     dict = xmlMalloc(sizeof(xmlDict));
     if (dict) {
         dict->ref_counter = 1;
         dict->limit = 0;

         dict->size = MIN_DICT_SIZE;
 	dict->nbElems = 0;
         dict->dict = xmlMalloc(MIN_DICT_SIZE * sizeof(xmlDictEntry));
 	dict->strings = NULL;
 	dict->subdict = NULL;
         if (dict->dict) {
 	    memset(dict->dict, 0, MIN_DICT_SIZE * sizeof(xmlDictEntry));
 #ifdef DICT_RANDOMIZATION
             dict->seed = xmlRandom();
 #else
             dict->seed = 0;
 #endif
 	    return(dict);
         }
         xmlFree(dict);
     }
     return(NULL);
 }

 /**
  * xmlDictCreateSub:
  * @sub: an existing dictionary
  *
  * Create a new dictionary, inheriting strings from the read-only
  * dictionary @sub. On lookup, strings are first searched in the
  * new dictionary, then in @sub, and if not found are created in the
  * new dictionary.
  *
  * Returns the newly created dictionary, or NULL if an error occurred.
  */
 xmlDictPtr
 xmlDictCreateSub(xmlDictPtr sub) {
     xmlDictPtr dict = xmlDictCreate();

     if ((dict != NULL) && (sub != NULL)) {
 #ifdef DICT_DEBUG_PATTERNS
         fprintf(stderr, "R");
 #endif
         dict->seed = sub->seed;
         dict->subdict = sub;
 	xmlDictReference(dict->subdict);
     }
     return(dict);
 }

 /**
  * xmlDictReference:
  * @dict: the dictionary
  *
  * Increment the reference counter of a dictionary
  *
  * Returns 0 in case of success and -1 in case of error
  */
 int
 xmlDictReference(xmlDictPtr dict) {
     if (dict == NULL) return -1;
     xmlMutexLock(&xmlDictMutex);
     dict->ref_counter++;
     xmlMutexUnlock(&xmlDictMutex);
     return(0);
 }

 /**
  * xmlDictGrow:
  * @dict: the dictionary
  * @size: the new size of the dictionary
  *
  * resize the dictionary
  *
  * Returns 0 in case of success, -1 in case of failure
  */
 static int
 xmlDictGrow(xmlDictPtr dict, size_t size) {
     unsigned key, okey;
     size_t oldsize, i;
     xmlDictEntryPtr iter, next;
     struct _xmlDictEntry *olddict;
 #ifdef DEBUG_GROW
     unsigned nbElem = 0;
 #endif
     int ret = 0;
     int keep_keys = 1;

     if (dict == NULL)
 	return(-1);
     oldsize = dict->size;
     if (size <= oldsize)
 	return(0);

 #ifdef DICT_DEBUG_PATTERNS
     fprintf(stderr, "*");
 #endif

     olddict = dict->dict;
     if (olddict == NULL)
         return(-1);
     if (oldsize == MIN_DICT_SIZE)
         keep_keys = 0;

     dict->dict = xmlMalloc(size * sizeof(xmlDictEntry));
     if (dict->dict == NULL) {
 	dict->dict = olddict;
 	return(-1);
     }
     memset(dict->dict, 0, size * sizeof(xmlDictEntry));
     dict->size = size;

     /*	If the two loops are merged, there would be situations where
 	a new entry needs to allocated and data copied into it from
 	the main dict. It is nicer to run through the array twice, first
 	copying all the elements in the main array (less probability of
 	allocate) and then the rest, so we only free in the second loop.
     */
     for (i = 0; i < oldsize; i++) {
 	if (olddict[i].valid == 0)
 	    continue;

 	if (keep_keys)
 	    okey = olddict[i].okey;
 	else
 	    okey = xmlDictComputeKey(dict, olddict[i].name, olddict[i].len);
 	key = okey % dict->size;

 	if (dict->dict[key].valid == 0) {
 	    memcpy(&(dict->dict[key]), &(olddict[i]), sizeof(xmlDictEntry));
 	    dict->dict[key].next = NULL;
 	    dict->dict[key].okey = okey;
 	} else {
 	    xmlDictEntryPtr entry;

 	    entry = xmlMalloc(sizeof(xmlDictEntry));
 	    if (entry != NULL) {
 		entry->name = olddict[i].name;
 		entry->len = olddict[i].len;
 		entry->okey = okey;
 		entry->next = dict->dict[key].next;
 		entry->valid = 1;
 		dict->dict[key].next = entry;
 	    } else {
 	        /*
 		 * we don't have much ways to alert from here
 		 * result is losing an entry and unicity guarantee
 		 */
 	        ret = -1;
 	    }
 	}
 #ifdef DEBUG_GROW
 	nbElem++;
 #endif
     }

     for (i = 0; i < oldsize; i++) {
 	iter = olddict[i].next;
 	while (iter) {
 	    next = iter->next;

 	    /*
 	     * put back the entry in the new dict
 	     */

 	    if (keep_keys)
 		okey = iter->okey;
 	    else
 		okey = xmlDictComputeKey(dict, iter->name, iter->len);
 	    key = okey % dict->size;
 	    if (dict->dict[key].valid == 0) {
 		memcpy(&(dict->dict[key]), iter, sizeof(xmlDictEntry));
 		dict->dict[key].next = NULL;
 		dict->dict[key].valid = 1;
 		dict->dict[key].okey = okey;
 		xmlFree(iter);
 	    } else {
 		iter->next = dict->dict[key].next;
 		iter->okey = okey;
 		dict->dict[key].next = iter;
 	    }

 #ifdef DEBUG_GROW
 	    nbElem++;
 #endif

 	    iter = next;
 	}
     }

     xmlFree(olddict);

 #ifdef DEBUG_GROW
     xmlGenericError(xmlGenericErrorContext,
 	    "xmlDictGrow : from %lu to %lu, %u elems\n", oldsize, size, nbElem);
 #endif

     return(ret);
 }

 /**
  * xmlDictFree:
  * @dict: the dictionary
  *
  * Free the hash @dict and its contents. The userdata is
  * deallocated with @f if provided.
  */
 void
 xmlDictFree(xmlDictPtr dict) {
     size_t i;
     xmlDictEntryPtr iter;
     xmlDictEntryPtr next;
     int inside_dict = 0;
     xmlDictStringsPtr pool, nextp;

     if (dict == NULL)
 	return;

     /* decrement the counter, it may be shared by a parser and docs */
     xmlMutexLock(&xmlDictMutex);
     dict->ref_counter--;
     if (dict->ref_counter > 0) {
         xmlMutexUnlock(&xmlDictMutex);
         return;
     }

     xmlMutexUnlock(&xmlDictMutex);

     if (dict->subdict != NULL) {
         xmlDictFree(dict->subdict);
     }

     if (dict->dict) {
 	for(i = 0; ((i < dict->size) && (dict->nbElems > 0)); i++) {
 	    iter = &(dict->dict[i]);
 	    if (iter->valid == 0)
 		continue;
 	    inside_dict = 1;
 	    while (iter) {
 		next = iter->next;
 		if (!inside_dict)
 		    xmlFree(iter);
 		dict->nbElems--;
 		inside_dict = 0;
 		iter = next;
 	    }
 	}
 	xmlFree(dict->dict);
     }
     pool = dict->strings;
     while (pool != NULL) {
         nextp = pool->next;
 	xmlFree(pool);
 	pool = nextp;
     }
     xmlFree(dict);
 }

 /**
  * xmlDictLookup:
  * @dict: the dictionary
  * @name: the name of the userdata
  * @len: the length of the name, if -1 it is recomputed
  *
  * Add the @name to the dictionary @dict if not present.
  *
  * Returns the internal copy of the name or NULL in case of internal error
  */
 const xmlChar *
 xmlDictLookup(xmlDictPtr dict, const xmlChar *name, int len) {
     unsigned key, okey, nbi = 0;
     xmlDictEntryPtr entry;
     xmlDictEntryPtr insert;
     const xmlChar *ret;
     size_t l;

     if ((dict == NULL) || (name == NULL))
 	return(NULL);

     if (len < 0)
         l = strlen((const char *) name);
     else
         l = len;

     if (((dict->limit > 0) && (l >= dict->limit)) ||
         (l > INT_MAX / 2))
         return(NULL);

     /*
      * Check for duplicate and insertion location.
      */
     okey = xmlDictComputeKey(dict, name, l);
     key = okey % dict->size;
     if (dict->dict[key].valid == 0) {
 	insert = NULL;
     } else {
 	for (insert = &(dict->dict[key]); insert->next != NULL;
 	     insert = insert->next) {
 #ifdef __GNUC__
 	    if ((insert->okey == okey) && (insert->len == l)) {
 		if (!memcmp(insert->name, name, l))
 		    return(insert->name);
 	    }
 #else
 	    if ((insert->okey == okey) && (insert->len == l) &&
 	        (!xmlStrncmp(insert->name, name, l)))
 		return(insert->name);
 #endif
 	    nbi++;
 	}
 #ifdef __GNUC__
 	if ((insert->okey == okey) && (insert->len == l)) {
 	    if (!memcmp(insert->name, name, l))
 		return(insert->name);
 	}
 #else
 	if ((insert->okey == okey) && (insert->len == l) &&
 	    (!xmlStrncmp(insert->name, name, l)))
 	    return(insert->name);
 #endif
     }

     if (dict->subdict) {
         unsigned skey;

         /* we cannot always reuse the same okey for the subdict */
         if (((dict->size == MIN_DICT_SIZE) &&
 	     (dict->subdict->size != MIN_DICT_SIZE)) ||
             ((dict->size != MIN_DICT_SIZE) &&
 	     (dict->subdict->size == MIN_DICT_SIZE)))
 	    skey = xmlDictComputeKey(dict->subdict, name, l);
 	else
 	    skey = okey;

 	key = skey % dict->subdict->size;
 	if (dict->subdict->dict[key].valid != 0) {
 	    xmlDictEntryPtr tmp;

 	    for (tmp = &(dict->subdict->dict[key]); tmp->next != NULL;
 		 tmp = tmp->next) {
 #ifdef __GNUC__
 		if ((tmp->okey == skey) && (tmp->len == l)) {
 		    if (!memcmp(tmp->name, name, l))
 			return(tmp->name);
 		}
 #else
 		if ((tmp->okey == skey) && (tmp->len == l) &&
 		    (!xmlStrncmp(tmp->name, name, l)))
 		    return(tmp->name);
 #endif
 		nbi++;
 	    }
 #ifdef __GNUC__
 	    if ((tmp->okey == skey) && (tmp->len == l)) {
 		if (!memcmp(tmp->name, name, l))
 		    return(tmp->name);
 	    }
 #else
 	    if ((tmp->okey == skey) && (tmp->len == l) &&
 		(!xmlStrncmp(tmp->name, name, l)))
 		return(tmp->name);
 #endif
 	}
 	key = okey % dict->size;
     }

     ret = xmlDictAddString(dict, name, l);
     if (ret == NULL)
         return(NULL);
     if (insert == NULL) {
 	entry = &(dict->dict[key]);
     } else {
 	entry = xmlMalloc(sizeof(xmlDictEntry));
 	if (entry == NULL)
 	     return(NULL);
     }
     entry->name = ret;
     entry->len = l;
     entry->next = NULL;
     entry->valid = 1;
     entry->okey = okey;


     if (insert != NULL)
 	insert->next = entry;

     dict->nbElems++;

     if ((dict->nbElems > dict->size / MAX_FILL) ||
         (nbi > MAX_HASH_LEN)) {
         int newSize = dict->size > INT_MAX / GROWTH_FACTOR ?
                       INT_MAX :
                       GROWTH_FACTOR * dict->size;
 	if (xmlDictGrow(dict, newSize) != 0)
 	    return(NULL);
     }
     /* Note that entry may have been freed at this point by xmlDictGrow */

     return(ret);
 }

 /**
  * xmlDictExists:
  * @dict: the dictionary
  * @name: the name of the userdata
  * @len: the length of the name, if -1 it is recomputed
  *
  * Check if the @name exists in the dictionary @dict.
  *
  * Returns the internal copy of the name or NULL if not found.
  */
 const xmlChar *
 xmlDictExists(xmlDictPtr dict, const xmlChar *name, int len) {
     unsigned key, okey;
     xmlDictEntryPtr insert;
     size_t l;

     if ((dict == NULL) || (name == NULL))
 	return(NULL);

     if (len < 0)
         l = strlen((const char *) name);
     else
         l = len;
     if (((dict->limit > 0) && (l >= dict->limit)) ||
         (l > INT_MAX / 2))
         return(NULL);

     /*
      * Check for duplicate and insertion location.
      */
     okey = xmlDictComputeKey(dict, name, l);
     key = okey % dict->size;
     if (dict->dict[key].valid == 0) {
 	insert = NULL;
     } else {
 	for (insert = &(dict->dict[key]); insert->next != NULL;
 	     insert = insert->next) {
 #ifdef __GNUC__
 	    if ((insert->okey == okey) && (insert->len == l)) {
 		if (!memcmp(insert->name, name, l))
 		    return(insert->name);
 	    }
 #else
 	    if ((insert->okey == okey) && (insert->len == l) &&
 	        (!xmlStrncmp(insert->name, name, l)))
 		return(insert->name);
 #endif
 	}
 #ifdef __GNUC__
 	if ((insert->okey == okey) && (insert->len == l)) {
 	    if (!memcmp(insert->name, name, l))
 		return(insert->name);
 	}
 #else
 	if ((insert->okey == okey) && (insert->len == l) &&
 	    (!xmlStrncmp(insert->name, name, l)))
 	    return(insert->name);
 #endif
     }

     if (dict->subdict) {
         unsigned skey;

         /* we cannot always reuse the same okey for the subdict */
         if (((dict->size == MIN_DICT_SIZE) &&
 	     (dict->subdict->size != MIN_DICT_SIZE)) ||
             ((dict->size != MIN_DICT_SIZE) &&
 	     (dict->subdict->size == MIN_DICT_SIZE)))
 	    skey = xmlDictComputeKey(dict->subdict, name, l);
 	else
 	    skey = okey;

 	key = skey % dict->subdict->size;
 	if (dict->subdict->dict[key].valid != 0) {
 	    xmlDictEntryPtr tmp;

 	    for (tmp = &(dict->subdict->dict[key]); tmp->next != NULL;
 		 tmp = tmp->next) {
 #ifdef __GNUC__
 		if ((tmp->okey == skey) && (tmp->len == l)) {
 		    if (!memcmp(tmp->name, name, l))
 			return(tmp->name);
 		}
 #else
 		if ((tmp->okey == skey) && (tmp->len == l) &&
 		    (!xmlStrncmp(tmp->name, name, l)))
 		    return(tmp->name);
 #endif
 	    }
 #ifdef __GNUC__
 	    if ((tmp->okey == skey) && (tmp->len == l)) {
 		if (!memcmp(tmp->name, name, l))
 		    return(tmp->name);
 	    }
 #else
 	    if ((tmp->okey == skey) && (tmp->len == l) &&
 		(!xmlStrncmp(tmp->name, name, l)))
 		return(tmp->name);
 #endif
 	}
     }

     /* not found */
     return(NULL);
 }

 /**
  * xmlDictQLookup:
  * @dict: the dictionary
  * @prefix: the prefix
  * @name: the name
  *
  * Add the QName @prefix:@name to the hash @dict if not present.
  *
  * Returns the internal copy of the QName or NULL in case of internal error
  */
 const xmlChar *
 xmlDictQLookup(xmlDictPtr dict, const xmlChar *prefix, const xmlChar *name) {
     unsigned okey, key, nbi = 0;
     xmlDictEntryPtr entry;
     xmlDictEntryPtr insert;
     const xmlChar *ret;
     size_t len, plen, l;

     if ((dict == NULL) || (name == NULL))
 	return(NULL);
     if (prefix == NULL)
         return(xmlDictLookup(dict, name, -1));

     l = len = strlen((const char *) name);
     plen = strlen((const char *) prefix);
     if ((len > INT_MAX / 2) || (plen > INT_MAX / 2))
         return(NULL);
     len += 1 + plen;

     /*
      * Check for duplicate and insertion location.
      */
     okey = xmlDictComputeQKey(dict, prefix, plen, name, l);
     key = okey % dict->size;
     if (dict->dict[key].valid == 0) {
 	insert = NULL;
     } else {
 	for (insert = &(dict->dict[key]); insert->next != NULL;
 	     insert = insert->next) {
 	    if ((insert->okey == okey) && (insert->len == len) &&
 	        (xmlStrQEqual(prefix, name, insert->name)))
 		return(insert->name);
 	    nbi++;
 	}
 	if ((insert->okey == okey) && (insert->len == len) &&
 	    (xmlStrQEqual(prefix, name, insert->name)))
 	    return(insert->name);
     }

     if (dict->subdict) {
         unsigned skey;

         /* we cannot always reuse the same okey for the subdict */
         if (((dict->size == MIN_DICT_SIZE) &&
 	     (dict->subdict->size != MIN_DICT_SIZE)) ||
             ((dict->size != MIN_DICT_SIZE) &&
 	     (dict->subdict->size == MIN_DICT_SIZE)))
 	    skey = xmlDictComputeQKey(dict->subdict, prefix, plen, name, l);
 	else
 	    skey = okey;

 	key = skey % dict->subdict->size;
 	if (dict->subdict->dict[key].valid != 0) {
 	    xmlDictEntryPtr tmp;
 	    for (tmp = &(dict->subdict->dict[key]); tmp->next != NULL;
 		 tmp = tmp->next) {
 		if ((tmp->okey == skey) && (tmp->len == len) &&
 		    (xmlStrQEqual(prefix, name, tmp->name)))
 		    return(tmp->name);
 		nbi++;
 	    }
 	    if ((tmp->okey == skey) && (tmp->len == len) &&
 		(xmlStrQEqual(prefix, name, tmp->name)))
 		return(tmp->name);
 	}
 	key = okey % dict->size;
     }

     ret = xmlDictAddQString(dict, prefix, plen, name, l);
     if (ret == NULL)
         return(NULL);
     if (insert == NULL) {
 	entry = &(dict->dict[key]);
     } else {
 	entry = xmlMalloc(sizeof(xmlDictEntry));
 	if (entry == NULL)
 	     return(NULL);
     }
     entry->name = ret;
     entry->len = len;
     entry->next = NULL;
     entry->valid = 1;
     entry->okey = okey;

     if (insert != NULL)
 	insert->next = entry;

     dict->nbElems++;

     if ((dict->nbElems > dict->size / MAX_FILL) ||
         (nbi > MAX_HASH_LEN)) {
         int newSize = dict->size > INT_MAX / GROWTH_FACTOR ?
                       INT_MAX :
                       GROWTH_FACTOR * dict->size;
 	if (xmlDictGrow(dict, newSize) != 0)
 	    return(NULL);
     }
     /* Note that entry may have been freed at this point by xmlDictGrow */

     return(ret);
 }

 /**
  * xmlDictOwns:
  * @dict: the dictionary
  * @str: the string
  *
  * check if a string is owned by the dictionary
  *
  * Returns 1 if true, 0 if false and -1 in case of error
  * -1 in case of error
  */
 int
 xmlDictOwns(xmlDictPtr dict, const xmlChar *str) {
     xmlDictStringsPtr pool;

     if ((dict == NULL) || (str == NULL))
 	return(-1);
     pool = dict->strings;
     while (pool != NULL) {
         if ((str >= &pool->array[0]) && (str <= pool->free))
 	    return(1);
 	pool = pool->next;
     }
     if (dict->subdict)
         return(xmlDictOwns(dict->subdict, str));
     return(0);
 }

 /**
  * xmlDictSize:
  * @dict: the dictionary
  *
  * Query the number of elements installed in the hash @dict.
  *
  * Returns the number of elements in the dictionary or
  * -1 in case of error
  */
 int
 xmlDictSize(xmlDictPtr dict) {
     if (dict == NULL)
 	return(-1);
     if (dict->subdict)
         return(dict->nbElems + dict->subdict->nbElems);
     return(dict->nbElems);
 }

 /**
  * xmlDictSetLimit:
  * @dict: the dictionary
  * @limit: the limit in bytes
  *
  * Set a size limit for the dictionary
  * Added in 2.9.0
  *
  * Returns the previous limit of the dictionary or 0
  */
 size_t
 xmlDictSetLimit(xmlDictPtr dict, size_t limit) {
     size_t ret;

     if (dict == NULL)
 	return(0);
     ret = dict->limit;
     dict->limit = limit;
     return(ret);
 }

 /**
  * xmlDictGetUsage:
  * @dict: the dictionary
  *
  * Get how much memory is used by a dictionary for strings
  * Added in 2.9.0
  *
  * Returns the amount of strings allocated
  */
 size_t
 xmlDictGetUsage(xmlDictPtr dict) {
     xmlDictStringsPtr pool;
     size_t limit = 0;

     if (dict == NULL)
 	return(0);
     pool = dict->strings;
     while (pool != NULL) {
         limit += pool->size;
 	pool = pool->next;
     }
     return(limit);
 }