1 | /* |
2 | * dict.c: dictionary of reusable strings, just used to avoid allocation |
3 | * and freeing operations. |
4 | * |
5 | * Copyright (C) 2003-2012 Daniel Veillard. |
6 | * |
7 | * Permission to use, copy, modify, and distribute this software for any |
8 | * purpose with or without fee is hereby granted, provided that the above |
9 | * copyright notice and this permission notice appear in all copies. |
10 | * |
11 | * THIS SOFTWARE IS PROVIDED ``AS IS'' AND WITHOUT ANY EXPRESS OR IMPLIED |
12 | * WARRANTIES, INCLUDING, WITHOUT LIMITATION, THE IMPLIED WARRANTIES OF |
13 | * MERCHANTIBILITY AND FITNESS FOR A PARTICULAR PURPOSE. THE AUTHORS AND |
14 | * CONTRIBUTORS ACCEPT NO RESPONSIBILITY IN ANY CONCEIVABLE MANNER. |
15 | * |
16 | * Author: daniel@veillard.com |
17 | */ |
18 | |
19 | #define IN_LIBXML |
20 | #include "libxml.h" |
21 | |
22 | #include <limits.h> |
23 | #ifdef HAVE_STDLIB_H |
24 | #include <stdlib.h> |
25 | #endif |
26 | #ifdef HAVE_TIME_H |
27 | #include <time.h> |
28 | #endif |
29 | |
30 | /* |
31 | * Following http://www.ocert.org/advisories/ocert-2011-003.html |
32 | * it seems that having hash randomization might be a good idea |
33 | * when using XML with untrusted data |
34 | * Note1: that it works correctly only if compiled with WITH_BIG_KEY |
35 | * which is the default. |
36 | * Note2: the fast function used for a small dict won't protect very |
37 | * well but since the attack is based on growing a very big hash |
38 | * list we will use the BigKey algo as soon as the hash size grows |
39 | * over MIN_DICT_SIZE so this actually works |
40 | */ |
41 | #if defined(HAVE_RAND) && defined(HAVE_SRAND) && defined(HAVE_TIME) |
42 | #define DICT_RANDOMIZATION |
43 | #endif |
44 | |
45 | #include <string.h> |
46 | #ifdef HAVE_STDINT_H |
47 | #include <stdint.h> |
48 | #else |
49 | #ifdef HAVE_INTTYPES_H |
50 | #include <inttypes.h> |
51 | #elif defined(_WIN32) |
52 | typedef unsigned __int32 uint32_t; |
53 | #endif |
54 | #endif |
55 | #include <libxml/tree.h> |
56 | #include <libxml/dict.h> |
57 | #include <libxml/xmlmemory.h> |
58 | #include <libxml/xmlerror.h> |
59 | #include <libxml/globals.h> |
60 | |
61 | /* #define DEBUG_GROW */ |
62 | /* #define DICT_DEBUG_PATTERNS */ |
63 | |
64 | #define MAX_HASH_LEN 3 |
65 | #define MIN_DICT_SIZE 128 |
66 | #define MAX_DICT_HASH 8 * 2048 |
67 | #define WITH_BIG_KEY |
68 | |
69 | #ifdef WITH_BIG_KEY |
70 | #define xmlDictComputeKey(dict, name, len) \ |
71 | (((dict)->size == MIN_DICT_SIZE) ? \ |
72 | xmlDictComputeFastKey(name, len, (dict)->seed) : \ |
73 | xmlDictComputeBigKey(name, len, (dict)->seed)) |
74 | |
75 | #define xmlDictComputeQKey(dict, prefix, plen, name, len) \ |
76 | (((prefix) == NULL) ? \ |
77 | (xmlDictComputeKey(dict, name, len)) : \ |
78 | (((dict)->size == MIN_DICT_SIZE) ? \ |
79 | xmlDictComputeFastQKey(prefix, plen, name, len, (dict)->seed) : \ |
80 | xmlDictComputeBigQKey(prefix, plen, name, len, (dict)->seed))) |
81 | |
82 | #else /* !WITH_BIG_KEY */ |
83 | #define xmlDictComputeKey(dict, name, len) \ |
84 | xmlDictComputeFastKey(name, len, (dict)->seed) |
85 | #define xmlDictComputeQKey(dict, prefix, plen, name, len) \ |
86 | xmlDictComputeFastQKey(prefix, plen, name, len, (dict)->seed) |
87 | #endif /* WITH_BIG_KEY */ |
88 | |
89 | /* |
90 | * An entry in the dictionary |
91 | */ |
92 | typedef struct _xmlDictEntry xmlDictEntry; |
93 | typedef xmlDictEntry *xmlDictEntryPtr; |
94 | struct _xmlDictEntry { |
95 | struct _xmlDictEntry *next; |
96 | const xmlChar *name; |
97 | unsigned int len; |
98 | int valid; |
99 | unsigned long okey; |
100 | }; |
101 | |
102 | typedef struct _xmlDictStrings xmlDictStrings; |
103 | typedef xmlDictStrings *xmlDictStringsPtr; |
104 | struct _xmlDictStrings { |
105 | xmlDictStringsPtr next; |
106 | xmlChar *free; |
107 | xmlChar *end; |
108 | size_t size; |
109 | size_t nbStrings; |
110 | xmlChar array[1]; |
111 | }; |
112 | /* |
113 | * The entire dictionary |
114 | */ |
115 | struct _xmlDict { |
116 | int ref_counter; |
117 | |
118 | struct _xmlDictEntry *dict; |
119 | size_t size; |
120 | unsigned int nbElems; |
121 | xmlDictStringsPtr strings; |
122 | |
123 | struct _xmlDict *subdict; |
124 | /* used for randomization */ |
125 | int seed; |
126 | /* used to impose a limit on size */ |
127 | size_t limit; |
128 | }; |
129 | |
130 | /* |
131 | * A mutex for modifying the reference counter for shared |
132 | * dictionaries. |
133 | */ |
134 | static xmlRMutexPtr xmlDictMutex = NULL; |
135 | |
136 | /* |
137 | * Whether the dictionary mutex was initialized. |
138 | */ |
139 | static int xmlDictInitialized = 0; |
140 | |
141 | #ifdef DICT_RANDOMIZATION |
142 | #ifdef HAVE_RAND_R |
143 | /* |
144 | * Internal data for random function, protected by xmlDictMutex |
145 | */ |
146 | static unsigned int rand_seed = 0; |
147 | #endif |
148 | #endif |
149 | |
150 | /** |
151 | * xmlInitializeDict: |
152 | * |
153 | * Do the dictionary mutex initialization. |
154 | * this function is deprecated |
155 | * |
156 | * Returns 0 if initialization was already done, and 1 if that |
157 | * call led to the initialization |
158 | */ |
159 | int xmlInitializeDict(void) { |
160 | return(0); |
161 | } |
162 | |
163 | /** |
164 | * __xmlInitializeDict: |
165 | * |
166 | * This function is not public |
167 | * Do the dictionary mutex initialization. |
168 | * this function is not thread safe, initialization should |
169 | * normally be done once at setup when called from xmlOnceInit() |
170 | * we may also land in this code if thread support is not compiled in |
171 | * |
172 | * Returns 0 if initialization was already done, and 1 if that |
173 | * call led to the initialization |
174 | */ |
175 | int __xmlInitializeDict(void) { |
176 | if (xmlDictInitialized) |
177 | return(1); |
178 | |
179 | if ((xmlDictMutex = xmlNewRMutex()) == NULL) |
180 | return(0); |
181 | xmlRMutexLock(xmlDictMutex); |
182 | |
183 | #ifdef DICT_RANDOMIZATION |
184 | #ifdef HAVE_RAND_R |
185 | rand_seed = time(NULL); |
186 | rand_r(& rand_seed); |
187 | #else |
188 | srand(time(NULL)); |
189 | #endif |
190 | #endif |
191 | xmlDictInitialized = 1; |
192 | xmlRMutexUnlock(xmlDictMutex); |
193 | return(1); |
194 | } |
195 | |
196 | #ifdef DICT_RANDOMIZATION |
197 | int __xmlRandom(void) { |
198 | int ret; |
199 | |
200 | if (xmlDictInitialized == 0) |
201 | __xmlInitializeDict(); |
202 | |
203 | xmlRMutexLock(xmlDictMutex); |
204 | #ifdef HAVE_RAND_R |
205 | ret = rand_r(& rand_seed); |
206 | #else |
207 | ret = rand(); |
208 | #endif |
209 | xmlRMutexUnlock(xmlDictMutex); |
210 | return(ret); |
211 | } |
212 | #endif |
213 | |
214 | /** |
215 | * xmlDictCleanup: |
216 | * |
217 | * Free the dictionary mutex. Do not call unless sure the library |
218 | * is not in use anymore ! |
219 | */ |
220 | void |
221 | xmlDictCleanup(void) { |
222 | if (!xmlDictInitialized) |
223 | return; |
224 | |
225 | xmlFreeRMutex(xmlDictMutex); |
226 | |
227 | xmlDictInitialized = 0; |
228 | } |
229 | |
230 | /* |
231 | * xmlDictAddString: |
232 | * @dict: the dictionary |
233 | * @name: the name of the userdata |
234 | * @len: the length of the name |
235 | * |
236 | * Add the string to the array[s] |
237 | * |
238 | * Returns the pointer of the local string, or NULL in case of error. |
239 | */ |
240 | static const xmlChar * |
241 | xmlDictAddString(xmlDictPtr dict, const xmlChar *name, unsigned int namelen) { |
242 | xmlDictStringsPtr pool; |
243 | const xmlChar *ret; |
244 | size_t size = 0; /* + sizeof(_xmlDictStrings) == 1024 */ |
245 | size_t limit = 0; |
246 | |
247 | #ifdef DICT_DEBUG_PATTERNS |
248 | fprintf(stderr, "-" ); |
249 | #endif |
250 | pool = dict->strings; |
251 | while (pool != NULL) { |
252 | if ((size_t)(pool->end - pool->free) > namelen) |
253 | goto found_pool; |
254 | if (pool->size > size) size = pool->size; |
255 | limit += pool->size; |
256 | pool = pool->next; |
257 | } |
258 | /* |
259 | * Not found, need to allocate |
260 | */ |
261 | if (pool == NULL) { |
262 | if ((dict->limit > 0) && (limit > dict->limit)) { |
263 | return(NULL); |
264 | } |
265 | |
266 | if (size == 0) size = 1000; |
267 | else size *= 4; /* exponential growth */ |
268 | if (size < 4 * namelen) |
269 | size = 4 * namelen; /* just in case ! */ |
270 | pool = (xmlDictStringsPtr) xmlMalloc(sizeof(xmlDictStrings) + size); |
271 | if (pool == NULL) |
272 | return(NULL); |
273 | pool->size = size; |
274 | pool->nbStrings = 0; |
275 | pool->free = &pool->array[0]; |
276 | pool->end = &pool->array[size]; |
277 | pool->next = dict->strings; |
278 | dict->strings = pool; |
279 | #ifdef DICT_DEBUG_PATTERNS |
280 | fprintf(stderr, "+" ); |
281 | #endif |
282 | } |
283 | found_pool: |
284 | ret = pool->free; |
285 | memcpy(pool->free, name, namelen); |
286 | pool->free += namelen; |
287 | *(pool->free++) = 0; |
288 | pool->nbStrings++; |
289 | return(ret); |
290 | } |
291 | |
292 | /* |
293 | * xmlDictAddQString: |
294 | * @dict: the dictionary |
295 | * @prefix: the prefix of the userdata |
296 | * @plen: the prefix length |
297 | * @name: the name of the userdata |
298 | * @len: the length of the name |
299 | * |
300 | * Add the QName to the array[s] |
301 | * |
302 | * Returns the pointer of the local string, or NULL in case of error. |
303 | */ |
304 | static const xmlChar * |
305 | xmlDictAddQString(xmlDictPtr dict, const xmlChar *prefix, unsigned int plen, |
306 | const xmlChar *name, unsigned int namelen) |
307 | { |
308 | xmlDictStringsPtr pool; |
309 | const xmlChar *ret; |
310 | size_t size = 0; /* + sizeof(_xmlDictStrings) == 1024 */ |
311 | size_t limit = 0; |
312 | |
313 | if (prefix == NULL) return(xmlDictAddString(dict, name, namelen)); |
314 | |
315 | #ifdef DICT_DEBUG_PATTERNS |
316 | fprintf(stderr, "=" ); |
317 | #endif |
318 | pool = dict->strings; |
319 | while (pool != NULL) { |
320 | if ((size_t)(pool->end - pool->free) > namelen + plen + 1) |
321 | goto found_pool; |
322 | if (pool->size > size) size = pool->size; |
323 | limit += pool->size; |
324 | pool = pool->next; |
325 | } |
326 | /* |
327 | * Not found, need to allocate |
328 | */ |
329 | if (pool == NULL) { |
330 | if ((dict->limit > 0) && (limit > dict->limit)) { |
331 | return(NULL); |
332 | } |
333 | |
334 | if (size == 0) size = 1000; |
335 | else size *= 4; /* exponential growth */ |
336 | if (size < 4 * (namelen + plen + 1)) |
337 | size = 4 * (namelen + plen + 1); /* just in case ! */ |
338 | pool = (xmlDictStringsPtr) xmlMalloc(sizeof(xmlDictStrings) + size); |
339 | if (pool == NULL) |
340 | return(NULL); |
341 | pool->size = size; |
342 | pool->nbStrings = 0; |
343 | pool->free = &pool->array[0]; |
344 | pool->end = &pool->array[size]; |
345 | pool->next = dict->strings; |
346 | dict->strings = pool; |
347 | #ifdef DICT_DEBUG_PATTERNS |
348 | fprintf(stderr, "+" ); |
349 | #endif |
350 | } |
351 | found_pool: |
352 | ret = pool->free; |
353 | memcpy(pool->free, prefix, plen); |
354 | pool->free += plen; |
355 | *(pool->free++) = ':'; |
356 | memcpy(pool->free, name, namelen); |
357 | pool->free += namelen; |
358 | *(pool->free++) = 0; |
359 | pool->nbStrings++; |
360 | return(ret); |
361 | } |
362 | |
363 | #ifdef WITH_BIG_KEY |
364 | /* |
365 | * xmlDictComputeBigKey: |
366 | * |
367 | * Calculate a hash key using a good hash function that works well for |
368 | * larger hash table sizes. |
369 | * |
370 | * Hash function by "One-at-a-Time Hash" see |
371 | * http://burtleburtle.net/bob/hash/doobs.html |
372 | */ |
373 | |
374 | static uint32_t |
375 | xmlDictComputeBigKey(const xmlChar* data, int namelen, int seed) { |
376 | uint32_t hash; |
377 | int i; |
378 | |
379 | if (namelen <= 0 || data == NULL) return(0); |
380 | |
381 | hash = seed; |
382 | |
383 | for (i = 0;i < namelen; i++) { |
384 | hash += data[i]; |
385 | hash += (hash << 10); |
386 | hash ^= (hash >> 6); |
387 | } |
388 | hash += (hash << 3); |
389 | hash ^= (hash >> 11); |
390 | hash += (hash << 15); |
391 | |
392 | return hash; |
393 | } |
394 | |
395 | /* |
396 | * xmlDictComputeBigQKey: |
397 | * |
398 | * Calculate a hash key for two strings using a good hash function |
399 | * that works well for larger hash table sizes. |
400 | * |
401 | * Hash function by "One-at-a-Time Hash" see |
402 | * http://burtleburtle.net/bob/hash/doobs.html |
403 | * |
404 | * Neither of the two strings must be NULL. |
405 | */ |
406 | static unsigned long |
407 | xmlDictComputeBigQKey(const xmlChar *prefix, int plen, |
408 | const xmlChar *name, int len, int seed) |
409 | { |
410 | uint32_t hash; |
411 | int i; |
412 | |
413 | hash = seed; |
414 | |
415 | for (i = 0;i < plen; i++) { |
416 | hash += prefix[i]; |
417 | hash += (hash << 10); |
418 | hash ^= (hash >> 6); |
419 | } |
420 | hash += ':'; |
421 | hash += (hash << 10); |
422 | hash ^= (hash >> 6); |
423 | |
424 | for (i = 0;i < len; i++) { |
425 | hash += name[i]; |
426 | hash += (hash << 10); |
427 | hash ^= (hash >> 6); |
428 | } |
429 | hash += (hash << 3); |
430 | hash ^= (hash >> 11); |
431 | hash += (hash << 15); |
432 | |
433 | return hash; |
434 | } |
435 | #endif /* WITH_BIG_KEY */ |
436 | |
437 | /* |
438 | * xmlDictComputeFastKey: |
439 | * |
440 | * Calculate a hash key using a fast hash function that works well |
441 | * for low hash table fill. |
442 | */ |
443 | static unsigned long |
444 | xmlDictComputeFastKey(const xmlChar *name, int namelen, int seed) { |
445 | unsigned long value = seed; |
446 | |
447 | if (name == NULL) return(0); |
448 | value = *name; |
449 | value <<= 5; |
450 | if (namelen > 10) { |
451 | value += name[namelen - 1]; |
452 | namelen = 10; |
453 | } |
454 | switch (namelen) { |
455 | case 10: value += name[9]; |
456 | /* Falls through. */ |
457 | case 9: value += name[8]; |
458 | /* Falls through. */ |
459 | case 8: value += name[7]; |
460 | /* Falls through. */ |
461 | case 7: value += name[6]; |
462 | /* Falls through. */ |
463 | case 6: value += name[5]; |
464 | /* Falls through. */ |
465 | case 5: value += name[4]; |
466 | /* Falls through. */ |
467 | case 4: value += name[3]; |
468 | /* Falls through. */ |
469 | case 3: value += name[2]; |
470 | /* Falls through. */ |
471 | case 2: value += name[1]; |
472 | /* Falls through. */ |
473 | default: break; |
474 | } |
475 | return(value); |
476 | } |
477 | |
478 | /* |
479 | * xmlDictComputeFastQKey: |
480 | * |
481 | * Calculate a hash key for two strings using a fast hash function |
482 | * that works well for low hash table fill. |
483 | * |
484 | * Neither of the two strings must be NULL. |
485 | */ |
486 | static unsigned long |
487 | xmlDictComputeFastQKey(const xmlChar *prefix, int plen, |
488 | const xmlChar *name, int len, int seed) |
489 | { |
490 | unsigned long value = (unsigned long) seed; |
491 | |
492 | if (plen == 0) |
493 | value += 30 * (unsigned long) ':'; |
494 | else |
495 | value += 30 * (*prefix); |
496 | |
497 | if (len > 10) { |
498 | int offset = len - (plen + 1 + 1); |
499 | if (offset < 0) |
500 | offset = len - (10 + 1); |
501 | value += name[offset]; |
502 | len = 10; |
503 | if (plen > 10) |
504 | plen = 10; |
505 | } |
506 | switch (plen) { |
507 | case 10: value += prefix[9]; |
508 | /* Falls through. */ |
509 | case 9: value += prefix[8]; |
510 | /* Falls through. */ |
511 | case 8: value += prefix[7]; |
512 | /* Falls through. */ |
513 | case 7: value += prefix[6]; |
514 | /* Falls through. */ |
515 | case 6: value += prefix[5]; |
516 | /* Falls through. */ |
517 | case 5: value += prefix[4]; |
518 | /* Falls through. */ |
519 | case 4: value += prefix[3]; |
520 | /* Falls through. */ |
521 | case 3: value += prefix[2]; |
522 | /* Falls through. */ |
523 | case 2: value += prefix[1]; |
524 | /* Falls through. */ |
525 | case 1: value += prefix[0]; |
526 | /* Falls through. */ |
527 | default: break; |
528 | } |
529 | len -= plen; |
530 | if (len > 0) { |
531 | value += (unsigned long) ':'; |
532 | len--; |
533 | } |
534 | switch (len) { |
535 | case 10: value += name[9]; |
536 | /* Falls through. */ |
537 | case 9: value += name[8]; |
538 | /* Falls through. */ |
539 | case 8: value += name[7]; |
540 | /* Falls through. */ |
541 | case 7: value += name[6]; |
542 | /* Falls through. */ |
543 | case 6: value += name[5]; |
544 | /* Falls through. */ |
545 | case 5: value += name[4]; |
546 | /* Falls through. */ |
547 | case 4: value += name[3]; |
548 | /* Falls through. */ |
549 | case 3: value += name[2]; |
550 | /* Falls through. */ |
551 | case 2: value += name[1]; |
552 | /* Falls through. */ |
553 | case 1: value += name[0]; |
554 | /* Falls through. */ |
555 | default: break; |
556 | } |
557 | return(value); |
558 | } |
559 | |
560 | /** |
561 | * xmlDictCreate: |
562 | * |
563 | * Create a new dictionary |
564 | * |
565 | * Returns the newly created dictionary, or NULL if an error occurred. |
566 | */ |
567 | xmlDictPtr |
568 | xmlDictCreate(void) { |
569 | xmlDictPtr dict; |
570 | |
571 | if (!xmlDictInitialized) |
572 | if (!__xmlInitializeDict()) |
573 | return(NULL); |
574 | |
575 | #ifdef DICT_DEBUG_PATTERNS |
576 | fprintf(stderr, "C" ); |
577 | #endif |
578 | |
579 | dict = xmlMalloc(sizeof(xmlDict)); |
580 | if (dict) { |
581 | dict->ref_counter = 1; |
582 | dict->limit = 0; |
583 | |
584 | dict->size = MIN_DICT_SIZE; |
585 | dict->nbElems = 0; |
586 | dict->dict = xmlMalloc(MIN_DICT_SIZE * sizeof(xmlDictEntry)); |
587 | dict->strings = NULL; |
588 | dict->subdict = NULL; |
589 | if (dict->dict) { |
590 | memset(dict->dict, 0, MIN_DICT_SIZE * sizeof(xmlDictEntry)); |
591 | #ifdef DICT_RANDOMIZATION |
592 | dict->seed = __xmlRandom(); |
593 | #else |
594 | dict->seed = 0; |
595 | #endif |
596 | return(dict); |
597 | } |
598 | xmlFree(dict); |
599 | } |
600 | return(NULL); |
601 | } |
602 | |
603 | /** |
604 | * xmlDictCreateSub: |
605 | * @sub: an existing dictionary |
606 | * |
607 | * Create a new dictionary, inheriting strings from the read-only |
608 | * dictionary @sub. On lookup, strings are first searched in the |
609 | * new dictionary, then in @sub, and if not found are created in the |
610 | * new dictionary. |
611 | * |
612 | * Returns the newly created dictionary, or NULL if an error occurred. |
613 | */ |
614 | xmlDictPtr |
615 | xmlDictCreateSub(xmlDictPtr sub) { |
616 | xmlDictPtr dict = xmlDictCreate(); |
617 | |
618 | if ((dict != NULL) && (sub != NULL)) { |
619 | #ifdef DICT_DEBUG_PATTERNS |
620 | fprintf(stderr, "R" ); |
621 | #endif |
622 | dict->seed = sub->seed; |
623 | dict->subdict = sub; |
624 | xmlDictReference(dict->subdict); |
625 | } |
626 | return(dict); |
627 | } |
628 | |
629 | /** |
630 | * xmlDictReference: |
631 | * @dict: the dictionary |
632 | * |
633 | * Increment the reference counter of a dictionary |
634 | * |
635 | * Returns 0 in case of success and -1 in case of error |
636 | */ |
637 | int |
638 | xmlDictReference(xmlDictPtr dict) { |
639 | if (!xmlDictInitialized) |
640 | if (!__xmlInitializeDict()) |
641 | return(-1); |
642 | |
643 | if (dict == NULL) return -1; |
644 | xmlRMutexLock(xmlDictMutex); |
645 | dict->ref_counter++; |
646 | xmlRMutexUnlock(xmlDictMutex); |
647 | return(0); |
648 | } |
649 | |
650 | /** |
651 | * xmlDictGrow: |
652 | * @dict: the dictionary |
653 | * @size: the new size of the dictionary |
654 | * |
655 | * resize the dictionary |
656 | * |
657 | * Returns 0 in case of success, -1 in case of failure |
658 | */ |
659 | static int |
660 | xmlDictGrow(xmlDictPtr dict, size_t size) { |
661 | unsigned long key, okey; |
662 | size_t oldsize, i; |
663 | xmlDictEntryPtr iter, next; |
664 | struct _xmlDictEntry *olddict; |
665 | #ifdef DEBUG_GROW |
666 | unsigned long nbElem = 0; |
667 | #endif |
668 | int ret = 0; |
669 | int keep_keys = 1; |
670 | |
671 | if (dict == NULL) |
672 | return(-1); |
673 | if (size < 8) |
674 | return(-1); |
675 | if (size > 8 * 2048) |
676 | return(-1); |
677 | |
678 | #ifdef DICT_DEBUG_PATTERNS |
679 | fprintf(stderr, "*" ); |
680 | #endif |
681 | |
682 | oldsize = dict->size; |
683 | olddict = dict->dict; |
684 | if (olddict == NULL) |
685 | return(-1); |
686 | if (oldsize == MIN_DICT_SIZE) |
687 | keep_keys = 0; |
688 | |
689 | dict->dict = xmlMalloc(size * sizeof(xmlDictEntry)); |
690 | if (dict->dict == NULL) { |
691 | dict->dict = olddict; |
692 | return(-1); |
693 | } |
694 | memset(dict->dict, 0, size * sizeof(xmlDictEntry)); |
695 | dict->size = size; |
696 | |
697 | /* If the two loops are merged, there would be situations where |
698 | a new entry needs to allocated and data copied into it from |
699 | the main dict. It is nicer to run through the array twice, first |
700 | copying all the elements in the main array (less probability of |
701 | allocate) and then the rest, so we only free in the second loop. |
702 | */ |
703 | for (i = 0; i < oldsize; i++) { |
704 | if (olddict[i].valid == 0) |
705 | continue; |
706 | |
707 | if (keep_keys) |
708 | okey = olddict[i].okey; |
709 | else |
710 | okey = xmlDictComputeKey(dict, olddict[i].name, olddict[i].len); |
711 | key = okey % dict->size; |
712 | |
713 | if (dict->dict[key].valid == 0) { |
714 | memcpy(&(dict->dict[key]), &(olddict[i]), sizeof(xmlDictEntry)); |
715 | dict->dict[key].next = NULL; |
716 | dict->dict[key].okey = okey; |
717 | } else { |
718 | xmlDictEntryPtr entry; |
719 | |
720 | entry = xmlMalloc(sizeof(xmlDictEntry)); |
721 | if (entry != NULL) { |
722 | entry->name = olddict[i].name; |
723 | entry->len = olddict[i].len; |
724 | entry->okey = okey; |
725 | entry->next = dict->dict[key].next; |
726 | entry->valid = 1; |
727 | dict->dict[key].next = entry; |
728 | } else { |
729 | /* |
730 | * we don't have much ways to alert from herei |
731 | * result is losing an entry and unicity guarantee |
732 | */ |
733 | ret = -1; |
734 | } |
735 | } |
736 | #ifdef DEBUG_GROW |
737 | nbElem++; |
738 | #endif |
739 | } |
740 | |
741 | for (i = 0; i < oldsize; i++) { |
742 | iter = olddict[i].next; |
743 | while (iter) { |
744 | next = iter->next; |
745 | |
746 | /* |
747 | * put back the entry in the new dict |
748 | */ |
749 | |
750 | if (keep_keys) |
751 | okey = iter->okey; |
752 | else |
753 | okey = xmlDictComputeKey(dict, iter->name, iter->len); |
754 | key = okey % dict->size; |
755 | if (dict->dict[key].valid == 0) { |
756 | memcpy(&(dict->dict[key]), iter, sizeof(xmlDictEntry)); |
757 | dict->dict[key].next = NULL; |
758 | dict->dict[key].valid = 1; |
759 | dict->dict[key].okey = okey; |
760 | xmlFree(iter); |
761 | } else { |
762 | iter->next = dict->dict[key].next; |
763 | iter->okey = okey; |
764 | dict->dict[key].next = iter; |
765 | } |
766 | |
767 | #ifdef DEBUG_GROW |
768 | nbElem++; |
769 | #endif |
770 | |
771 | iter = next; |
772 | } |
773 | } |
774 | |
775 | xmlFree(olddict); |
776 | |
777 | #ifdef DEBUG_GROW |
778 | xmlGenericError(xmlGenericErrorContext, |
779 | "xmlDictGrow : from %lu to %lu, %u elems\n" , oldsize, size, nbElem); |
780 | #endif |
781 | |
782 | return(ret); |
783 | } |
784 | |
785 | /** |
786 | * xmlDictFree: |
787 | * @dict: the dictionary |
788 | * |
789 | * Free the hash @dict and its contents. The userdata is |
790 | * deallocated with @f if provided. |
791 | */ |
792 | void |
793 | xmlDictFree(xmlDictPtr dict) { |
794 | size_t i; |
795 | xmlDictEntryPtr iter; |
796 | xmlDictEntryPtr next; |
797 | int inside_dict = 0; |
798 | xmlDictStringsPtr pool, nextp; |
799 | |
800 | if (dict == NULL) |
801 | return; |
802 | |
803 | if (!xmlDictInitialized) |
804 | if (!__xmlInitializeDict()) |
805 | return; |
806 | |
807 | /* decrement the counter, it may be shared by a parser and docs */ |
808 | xmlRMutexLock(xmlDictMutex); |
809 | dict->ref_counter--; |
810 | if (dict->ref_counter > 0) { |
811 | xmlRMutexUnlock(xmlDictMutex); |
812 | return; |
813 | } |
814 | |
815 | xmlRMutexUnlock(xmlDictMutex); |
816 | |
817 | if (dict->subdict != NULL) { |
818 | xmlDictFree(dict->subdict); |
819 | } |
820 | |
821 | if (dict->dict) { |
822 | for(i = 0; ((i < dict->size) && (dict->nbElems > 0)); i++) { |
823 | iter = &(dict->dict[i]); |
824 | if (iter->valid == 0) |
825 | continue; |
826 | inside_dict = 1; |
827 | while (iter) { |
828 | next = iter->next; |
829 | if (!inside_dict) |
830 | xmlFree(iter); |
831 | dict->nbElems--; |
832 | inside_dict = 0; |
833 | iter = next; |
834 | } |
835 | } |
836 | xmlFree(dict->dict); |
837 | } |
838 | pool = dict->strings; |
839 | while (pool != NULL) { |
840 | nextp = pool->next; |
841 | xmlFree(pool); |
842 | pool = nextp; |
843 | } |
844 | xmlFree(dict); |
845 | } |
846 | |
847 | /** |
848 | * xmlDictLookup: |
849 | * @dict: the dictionary |
850 | * @name: the name of the userdata |
851 | * @len: the length of the name, if -1 it is recomputed |
852 | * |
853 | * Add the @name to the dictionary @dict if not present. |
854 | * |
855 | * Returns the internal copy of the name or NULL in case of internal error |
856 | */ |
857 | const xmlChar * |
858 | xmlDictLookup(xmlDictPtr dict, const xmlChar *name, int len) { |
859 | unsigned long key, okey, nbi = 0; |
860 | xmlDictEntryPtr entry; |
861 | xmlDictEntryPtr insert; |
862 | const xmlChar *ret; |
863 | unsigned int l; |
864 | |
865 | if ((dict == NULL) || (name == NULL)) |
866 | return(NULL); |
867 | |
868 | if (len < 0) |
869 | l = strlen((const char *) name); |
870 | else |
871 | l = len; |
872 | |
873 | if (((dict->limit > 0) && (l >= dict->limit)) || |
874 | (l > INT_MAX / 2)) |
875 | return(NULL); |
876 | |
877 | /* |
878 | * Check for duplicate and insertion location. |
879 | */ |
880 | okey = xmlDictComputeKey(dict, name, l); |
881 | key = okey % dict->size; |
882 | if (dict->dict[key].valid == 0) { |
883 | insert = NULL; |
884 | } else { |
885 | for (insert = &(dict->dict[key]); insert->next != NULL; |
886 | insert = insert->next) { |
887 | #ifdef __GNUC__ |
888 | if ((insert->okey == okey) && (insert->len == l)) { |
889 | if (!memcmp(insert->name, name, l)) |
890 | return(insert->name); |
891 | } |
892 | #else |
893 | if ((insert->okey == okey) && (insert->len == l) && |
894 | (!xmlStrncmp(insert->name, name, l))) |
895 | return(insert->name); |
896 | #endif |
897 | nbi++; |
898 | } |
899 | #ifdef __GNUC__ |
900 | if ((insert->okey == okey) && (insert->len == l)) { |
901 | if (!memcmp(insert->name, name, l)) |
902 | return(insert->name); |
903 | } |
904 | #else |
905 | if ((insert->okey == okey) && (insert->len == l) && |
906 | (!xmlStrncmp(insert->name, name, l))) |
907 | return(insert->name); |
908 | #endif |
909 | } |
910 | |
911 | if (dict->subdict) { |
912 | unsigned long skey; |
913 | |
914 | /* we cannot always reuse the same okey for the subdict */ |
915 | if (((dict->size == MIN_DICT_SIZE) && |
916 | (dict->subdict->size != MIN_DICT_SIZE)) || |
917 | ((dict->size != MIN_DICT_SIZE) && |
918 | (dict->subdict->size == MIN_DICT_SIZE))) |
919 | skey = xmlDictComputeKey(dict->subdict, name, l); |
920 | else |
921 | skey = okey; |
922 | |
923 | key = skey % dict->subdict->size; |
924 | if (dict->subdict->dict[key].valid != 0) { |
925 | xmlDictEntryPtr tmp; |
926 | |
927 | for (tmp = &(dict->subdict->dict[key]); tmp->next != NULL; |
928 | tmp = tmp->next) { |
929 | #ifdef __GNUC__ |
930 | if ((tmp->okey == skey) && (tmp->len == l)) { |
931 | if (!memcmp(tmp->name, name, l)) |
932 | return(tmp->name); |
933 | } |
934 | #else |
935 | if ((tmp->okey == skey) && (tmp->len == l) && |
936 | (!xmlStrncmp(tmp->name, name, l))) |
937 | return(tmp->name); |
938 | #endif |
939 | nbi++; |
940 | } |
941 | #ifdef __GNUC__ |
942 | if ((tmp->okey == skey) && (tmp->len == l)) { |
943 | if (!memcmp(tmp->name, name, l)) |
944 | return(tmp->name); |
945 | } |
946 | #else |
947 | if ((tmp->okey == skey) && (tmp->len == l) && |
948 | (!xmlStrncmp(tmp->name, name, l))) |
949 | return(tmp->name); |
950 | #endif |
951 | } |
952 | key = okey % dict->size; |
953 | } |
954 | |
955 | ret = xmlDictAddString(dict, name, l); |
956 | if (ret == NULL) |
957 | return(NULL); |
958 | if (insert == NULL) { |
959 | entry = &(dict->dict[key]); |
960 | } else { |
961 | entry = xmlMalloc(sizeof(xmlDictEntry)); |
962 | if (entry == NULL) |
963 | return(NULL); |
964 | } |
965 | entry->name = ret; |
966 | entry->len = l; |
967 | entry->next = NULL; |
968 | entry->valid = 1; |
969 | entry->okey = okey; |
970 | |
971 | |
972 | if (insert != NULL) |
973 | insert->next = entry; |
974 | |
975 | dict->nbElems++; |
976 | |
977 | if ((nbi > MAX_HASH_LEN) && |
978 | (dict->size <= ((MAX_DICT_HASH / 2) / MAX_HASH_LEN))) { |
979 | if (xmlDictGrow(dict, MAX_HASH_LEN * 2 * dict->size) != 0) |
980 | return(NULL); |
981 | } |
982 | /* Note that entry may have been freed at this point by xmlDictGrow */ |
983 | |
984 | return(ret); |
985 | } |
986 | |
987 | /** |
988 | * xmlDictExists: |
989 | * @dict: the dictionary |
990 | * @name: the name of the userdata |
991 | * @len: the length of the name, if -1 it is recomputed |
992 | * |
993 | * Check if the @name exists in the dictionary @dict. |
994 | * |
995 | * Returns the internal copy of the name or NULL if not found. |
996 | */ |
997 | const xmlChar * |
998 | xmlDictExists(xmlDictPtr dict, const xmlChar *name, int len) { |
999 | unsigned long key, okey, nbi = 0; |
1000 | xmlDictEntryPtr insert; |
1001 | unsigned int l; |
1002 | |
1003 | if ((dict == NULL) || (name == NULL)) |
1004 | return(NULL); |
1005 | |
1006 | if (len < 0) |
1007 | l = strlen((const char *) name); |
1008 | else |
1009 | l = len; |
1010 | if (((dict->limit > 0) && (l >= dict->limit)) || |
1011 | (l > INT_MAX / 2)) |
1012 | return(NULL); |
1013 | |
1014 | /* |
1015 | * Check for duplicate and insertion location. |
1016 | */ |
1017 | okey = xmlDictComputeKey(dict, name, l); |
1018 | key = okey % dict->size; |
1019 | if (dict->dict[key].valid == 0) { |
1020 | insert = NULL; |
1021 | } else { |
1022 | for (insert = &(dict->dict[key]); insert->next != NULL; |
1023 | insert = insert->next) { |
1024 | #ifdef __GNUC__ |
1025 | if ((insert->okey == okey) && (insert->len == l)) { |
1026 | if (!memcmp(insert->name, name, l)) |
1027 | return(insert->name); |
1028 | } |
1029 | #else |
1030 | if ((insert->okey == okey) && (insert->len == l) && |
1031 | (!xmlStrncmp(insert->name, name, l))) |
1032 | return(insert->name); |
1033 | #endif |
1034 | nbi++; |
1035 | } |
1036 | #ifdef __GNUC__ |
1037 | if ((insert->okey == okey) && (insert->len == l)) { |
1038 | if (!memcmp(insert->name, name, l)) |
1039 | return(insert->name); |
1040 | } |
1041 | #else |
1042 | if ((insert->okey == okey) && (insert->len == l) && |
1043 | (!xmlStrncmp(insert->name, name, l))) |
1044 | return(insert->name); |
1045 | #endif |
1046 | } |
1047 | |
1048 | if (dict->subdict) { |
1049 | unsigned long skey; |
1050 | |
1051 | /* we cannot always reuse the same okey for the subdict */ |
1052 | if (((dict->size == MIN_DICT_SIZE) && |
1053 | (dict->subdict->size != MIN_DICT_SIZE)) || |
1054 | ((dict->size != MIN_DICT_SIZE) && |
1055 | (dict->subdict->size == MIN_DICT_SIZE))) |
1056 | skey = xmlDictComputeKey(dict->subdict, name, l); |
1057 | else |
1058 | skey = okey; |
1059 | |
1060 | key = skey % dict->subdict->size; |
1061 | if (dict->subdict->dict[key].valid != 0) { |
1062 | xmlDictEntryPtr tmp; |
1063 | |
1064 | for (tmp = &(dict->subdict->dict[key]); tmp->next != NULL; |
1065 | tmp = tmp->next) { |
1066 | #ifdef __GNUC__ |
1067 | if ((tmp->okey == skey) && (tmp->len == l)) { |
1068 | if (!memcmp(tmp->name, name, l)) |
1069 | return(tmp->name); |
1070 | } |
1071 | #else |
1072 | if ((tmp->okey == skey) && (tmp->len == l) && |
1073 | (!xmlStrncmp(tmp->name, name, l))) |
1074 | return(tmp->name); |
1075 | #endif |
1076 | nbi++; |
1077 | } |
1078 | #ifdef __GNUC__ |
1079 | if ((tmp->okey == skey) && (tmp->len == l)) { |
1080 | if (!memcmp(tmp->name, name, l)) |
1081 | return(tmp->name); |
1082 | } |
1083 | #else |
1084 | if ((tmp->okey == skey) && (tmp->len == l) && |
1085 | (!xmlStrncmp(tmp->name, name, l))) |
1086 | return(tmp->name); |
1087 | #endif |
1088 | } |
1089 | } |
1090 | |
1091 | /* not found */ |
1092 | return(NULL); |
1093 | } |
1094 | |
1095 | /** |
1096 | * xmlDictQLookup: |
1097 | * @dict: the dictionary |
1098 | * @prefix: the prefix |
1099 | * @name: the name |
1100 | * |
1101 | * Add the QName @prefix:@name to the hash @dict if not present. |
1102 | * |
1103 | * Returns the internal copy of the QName or NULL in case of internal error |
1104 | */ |
1105 | const xmlChar * |
1106 | xmlDictQLookup(xmlDictPtr dict, const xmlChar *prefix, const xmlChar *name) { |
1107 | unsigned long okey, key, nbi = 0; |
1108 | xmlDictEntryPtr entry; |
1109 | xmlDictEntryPtr insert; |
1110 | const xmlChar *ret; |
1111 | unsigned int len, plen, l; |
1112 | |
1113 | if ((dict == NULL) || (name == NULL)) |
1114 | return(NULL); |
1115 | if (prefix == NULL) |
1116 | return(xmlDictLookup(dict, name, -1)); |
1117 | |
1118 | l = len = strlen((const char *) name); |
1119 | plen = strlen((const char *) prefix); |
1120 | len += 1 + plen; |
1121 | |
1122 | /* |
1123 | * Check for duplicate and insertion location. |
1124 | */ |
1125 | okey = xmlDictComputeQKey(dict, prefix, plen, name, l); |
1126 | key = okey % dict->size; |
1127 | if (dict->dict[key].valid == 0) { |
1128 | insert = NULL; |
1129 | } else { |
1130 | for (insert = &(dict->dict[key]); insert->next != NULL; |
1131 | insert = insert->next) { |
1132 | if ((insert->okey == okey) && (insert->len == len) && |
1133 | (xmlStrQEqual(prefix, name, insert->name))) |
1134 | return(insert->name); |
1135 | nbi++; |
1136 | } |
1137 | if ((insert->okey == okey) && (insert->len == len) && |
1138 | (xmlStrQEqual(prefix, name, insert->name))) |
1139 | return(insert->name); |
1140 | } |
1141 | |
1142 | if (dict->subdict) { |
1143 | unsigned long skey; |
1144 | |
1145 | /* we cannot always reuse the same okey for the subdict */ |
1146 | if (((dict->size == MIN_DICT_SIZE) && |
1147 | (dict->subdict->size != MIN_DICT_SIZE)) || |
1148 | ((dict->size != MIN_DICT_SIZE) && |
1149 | (dict->subdict->size == MIN_DICT_SIZE))) |
1150 | skey = xmlDictComputeQKey(dict->subdict, prefix, plen, name, l); |
1151 | else |
1152 | skey = okey; |
1153 | |
1154 | key = skey % dict->subdict->size; |
1155 | if (dict->subdict->dict[key].valid != 0) { |
1156 | xmlDictEntryPtr tmp; |
1157 | for (tmp = &(dict->subdict->dict[key]); tmp->next != NULL; |
1158 | tmp = tmp->next) { |
1159 | if ((tmp->okey == skey) && (tmp->len == len) && |
1160 | (xmlStrQEqual(prefix, name, tmp->name))) |
1161 | return(tmp->name); |
1162 | nbi++; |
1163 | } |
1164 | if ((tmp->okey == skey) && (tmp->len == len) && |
1165 | (xmlStrQEqual(prefix, name, tmp->name))) |
1166 | return(tmp->name); |
1167 | } |
1168 | key = okey % dict->size; |
1169 | } |
1170 | |
1171 | ret = xmlDictAddQString(dict, prefix, plen, name, l); |
1172 | if (ret == NULL) |
1173 | return(NULL); |
1174 | if (insert == NULL) { |
1175 | entry = &(dict->dict[key]); |
1176 | } else { |
1177 | entry = xmlMalloc(sizeof(xmlDictEntry)); |
1178 | if (entry == NULL) |
1179 | return(NULL); |
1180 | } |
1181 | entry->name = ret; |
1182 | entry->len = len; |
1183 | entry->next = NULL; |
1184 | entry->valid = 1; |
1185 | entry->okey = okey; |
1186 | |
1187 | if (insert != NULL) |
1188 | insert->next = entry; |
1189 | |
1190 | dict->nbElems++; |
1191 | |
1192 | if ((nbi > MAX_HASH_LEN) && |
1193 | (dict->size <= ((MAX_DICT_HASH / 2) / MAX_HASH_LEN))) |
1194 | xmlDictGrow(dict, MAX_HASH_LEN * 2 * dict->size); |
1195 | /* Note that entry may have been freed at this point by xmlDictGrow */ |
1196 | |
1197 | return(ret); |
1198 | } |
1199 | |
1200 | /** |
1201 | * xmlDictOwns: |
1202 | * @dict: the dictionary |
1203 | * @str: the string |
1204 | * |
1205 | * check if a string is owned by the disctionary |
1206 | * |
1207 | * Returns 1 if true, 0 if false and -1 in case of error |
1208 | * -1 in case of error |
1209 | */ |
1210 | int |
1211 | xmlDictOwns(xmlDictPtr dict, const xmlChar *str) { |
1212 | xmlDictStringsPtr pool; |
1213 | |
1214 | if ((dict == NULL) || (str == NULL)) |
1215 | return(-1); |
1216 | pool = dict->strings; |
1217 | while (pool != NULL) { |
1218 | if ((str >= &pool->array[0]) && (str <= pool->free)) |
1219 | return(1); |
1220 | pool = pool->next; |
1221 | } |
1222 | if (dict->subdict) |
1223 | return(xmlDictOwns(dict->subdict, str)); |
1224 | return(0); |
1225 | } |
1226 | |
1227 | /** |
1228 | * xmlDictSize: |
1229 | * @dict: the dictionary |
1230 | * |
1231 | * Query the number of elements installed in the hash @dict. |
1232 | * |
1233 | * Returns the number of elements in the dictionary or |
1234 | * -1 in case of error |
1235 | */ |
1236 | int |
1237 | xmlDictSize(xmlDictPtr dict) { |
1238 | if (dict == NULL) |
1239 | return(-1); |
1240 | if (dict->subdict) |
1241 | return(dict->nbElems + dict->subdict->nbElems); |
1242 | return(dict->nbElems); |
1243 | } |
1244 | |
1245 | /** |
1246 | * xmlDictSetLimit: |
1247 | * @dict: the dictionary |
1248 | * @limit: the limit in bytes |
1249 | * |
1250 | * Set a size limit for the dictionary |
1251 | * Added in 2.9.0 |
1252 | * |
1253 | * Returns the previous limit of the dictionary or 0 |
1254 | */ |
1255 | size_t |
1256 | xmlDictSetLimit(xmlDictPtr dict, size_t limit) { |
1257 | size_t ret; |
1258 | |
1259 | if (dict == NULL) |
1260 | return(0); |
1261 | ret = dict->limit; |
1262 | dict->limit = limit; |
1263 | return(ret); |
1264 | } |
1265 | |
1266 | /** |
1267 | * xmlDictGetUsage: |
1268 | * @dict: the dictionary |
1269 | * |
1270 | * Get how much memory is used by a dictionary for strings |
1271 | * Added in 2.9.0 |
1272 | * |
1273 | * Returns the amount of strings allocated |
1274 | */ |
1275 | size_t |
1276 | xmlDictGetUsage(xmlDictPtr dict) { |
1277 | xmlDictStringsPtr pool; |
1278 | size_t limit = 0; |
1279 | |
1280 | if (dict == NULL) |
1281 | return(0); |
1282 | pool = dict->strings; |
1283 | while (pool != NULL) { |
1284 | limit += pool->size; |
1285 | pool = pool->next; |
1286 | } |
1287 | return(limit); |
1288 | } |
1289 | |
1290 | #define bottom_dict |
1291 | #include "elfgcchack.h" |
1292 | |