1 | /* |
2 | * entities.c : implementation for the XML entities handling |
3 | * |
4 | * See Copyright for the status of this software. |
5 | * |
6 | * daniel@veillard.com |
7 | */ |
8 | |
9 | /* To avoid EBCDIC trouble when parsing on zOS */ |
10 | #if defined(__MVS__) |
11 | #pragma convert("ISO8859-1") |
12 | #endif |
13 | |
14 | #define IN_LIBXML |
15 | #include "libxml.h" |
16 | |
17 | #include <string.h> |
18 | #ifdef HAVE_STDLIB_H |
19 | #include <stdlib.h> |
20 | #endif |
21 | #include <libxml/xmlmemory.h> |
22 | #include <libxml/hash.h> |
23 | #include <libxml/entities.h> |
24 | #include <libxml/parser.h> |
25 | #include <libxml/parserInternals.h> |
26 | #include <libxml/xmlerror.h> |
27 | #include <libxml/globals.h> |
28 | #include <libxml/dict.h> |
29 | |
30 | #include "save.h" |
31 | |
32 | /* |
33 | * The XML predefined entities. |
34 | */ |
35 | |
36 | static xmlEntity xmlEntityLt = { |
37 | NULL, XML_ENTITY_DECL, BAD_CAST "lt" , |
38 | NULL, NULL, NULL, NULL, NULL, NULL, |
39 | BAD_CAST "<" , BAD_CAST "<" , 1, |
40 | XML_INTERNAL_PREDEFINED_ENTITY, |
41 | NULL, NULL, NULL, NULL, 0, 1 |
42 | }; |
43 | static xmlEntity xmlEntityGt = { |
44 | NULL, XML_ENTITY_DECL, BAD_CAST "gt" , |
45 | NULL, NULL, NULL, NULL, NULL, NULL, |
46 | BAD_CAST ">" , BAD_CAST ">" , 1, |
47 | XML_INTERNAL_PREDEFINED_ENTITY, |
48 | NULL, NULL, NULL, NULL, 0, 1 |
49 | }; |
50 | static xmlEntity xmlEntityAmp = { |
51 | NULL, XML_ENTITY_DECL, BAD_CAST "amp" , |
52 | NULL, NULL, NULL, NULL, NULL, NULL, |
53 | BAD_CAST "&" , BAD_CAST "&" , 1, |
54 | XML_INTERNAL_PREDEFINED_ENTITY, |
55 | NULL, NULL, NULL, NULL, 0, 1 |
56 | }; |
57 | static xmlEntity xmlEntityQuot = { |
58 | NULL, XML_ENTITY_DECL, BAD_CAST "quot" , |
59 | NULL, NULL, NULL, NULL, NULL, NULL, |
60 | BAD_CAST "\"" , BAD_CAST "\"" , 1, |
61 | XML_INTERNAL_PREDEFINED_ENTITY, |
62 | NULL, NULL, NULL, NULL, 0, 1 |
63 | }; |
64 | static xmlEntity xmlEntityApos = { |
65 | NULL, XML_ENTITY_DECL, BAD_CAST "apos" , |
66 | NULL, NULL, NULL, NULL, NULL, NULL, |
67 | BAD_CAST "'" , BAD_CAST "'" , 1, |
68 | XML_INTERNAL_PREDEFINED_ENTITY, |
69 | NULL, NULL, NULL, NULL, 0, 1 |
70 | }; |
71 | |
72 | /** |
73 | * xmlEntitiesErrMemory: |
74 | * @extra: extra informations |
75 | * |
76 | * Handle an out of memory condition |
77 | */ |
78 | static void |
79 | xmlEntitiesErrMemory(const char *) |
80 | { |
81 | __xmlSimpleError(XML_FROM_TREE, XML_ERR_NO_MEMORY, NULL, NULL, extra); |
82 | } |
83 | |
84 | /** |
85 | * xmlEntitiesErr: |
86 | * @code: the error code |
87 | * @msg: the message |
88 | * |
89 | * Handle an out of memory condition |
90 | */ |
91 | static void LIBXML_ATTR_FORMAT(2,0) |
92 | xmlEntitiesErr(xmlParserErrors code, const char *msg) |
93 | { |
94 | __xmlSimpleError(XML_FROM_TREE, code, NULL, msg, NULL); |
95 | } |
96 | |
97 | /* |
98 | * xmlFreeEntity : clean-up an entity record. |
99 | */ |
100 | static void |
101 | xmlFreeEntity(xmlEntityPtr entity) |
102 | { |
103 | xmlDictPtr dict = NULL; |
104 | |
105 | if (entity == NULL) |
106 | return; |
107 | |
108 | if (entity->doc != NULL) |
109 | dict = entity->doc->dict; |
110 | |
111 | |
112 | if ((entity->children) && (entity->owner == 1) && |
113 | (entity == (xmlEntityPtr) entity->children->parent)) |
114 | xmlFreeNodeList(entity->children); |
115 | if (dict != NULL) { |
116 | if ((entity->name != NULL) && (!xmlDictOwns(dict, entity->name))) |
117 | xmlFree((char *) entity->name); |
118 | if ((entity->ExternalID != NULL) && |
119 | (!xmlDictOwns(dict, entity->ExternalID))) |
120 | xmlFree((char *) entity->ExternalID); |
121 | if ((entity->SystemID != NULL) && |
122 | (!xmlDictOwns(dict, entity->SystemID))) |
123 | xmlFree((char *) entity->SystemID); |
124 | if ((entity->URI != NULL) && (!xmlDictOwns(dict, entity->URI))) |
125 | xmlFree((char *) entity->URI); |
126 | if ((entity->content != NULL) |
127 | && (!xmlDictOwns(dict, entity->content))) |
128 | xmlFree((char *) entity->content); |
129 | if ((entity->orig != NULL) && (!xmlDictOwns(dict, entity->orig))) |
130 | xmlFree((char *) entity->orig); |
131 | } else { |
132 | if (entity->name != NULL) |
133 | xmlFree((char *) entity->name); |
134 | if (entity->ExternalID != NULL) |
135 | xmlFree((char *) entity->ExternalID); |
136 | if (entity->SystemID != NULL) |
137 | xmlFree((char *) entity->SystemID); |
138 | if (entity->URI != NULL) |
139 | xmlFree((char *) entity->URI); |
140 | if (entity->content != NULL) |
141 | xmlFree((char *) entity->content); |
142 | if (entity->orig != NULL) |
143 | xmlFree((char *) entity->orig); |
144 | } |
145 | xmlFree(entity); |
146 | } |
147 | |
148 | /* |
149 | * xmlCreateEntity: |
150 | * |
151 | * internal routine doing the entity node strutures allocations |
152 | */ |
153 | static xmlEntityPtr |
154 | xmlCreateEntity(xmlDictPtr dict, const xmlChar *name, int type, |
155 | const xmlChar *ExternalID, const xmlChar *SystemID, |
156 | const xmlChar *content) { |
157 | xmlEntityPtr ret; |
158 | |
159 | ret = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity)); |
160 | if (ret == NULL) { |
161 | xmlEntitiesErrMemory("xmlCreateEntity: malloc failed" ); |
162 | return(NULL); |
163 | } |
164 | memset(ret, 0, sizeof(xmlEntity)); |
165 | ret->type = XML_ENTITY_DECL; |
166 | ret->checked = 0; |
167 | |
168 | /* |
169 | * fill the structure. |
170 | */ |
171 | ret->etype = (xmlEntityType) type; |
172 | if (dict == NULL) { |
173 | ret->name = xmlStrdup(name); |
174 | if (ExternalID != NULL) |
175 | ret->ExternalID = xmlStrdup(ExternalID); |
176 | if (SystemID != NULL) |
177 | ret->SystemID = xmlStrdup(SystemID); |
178 | } else { |
179 | ret->name = xmlDictLookup(dict, name, -1); |
180 | if (ExternalID != NULL) |
181 | ret->ExternalID = xmlDictLookup(dict, ExternalID, -1); |
182 | if (SystemID != NULL) |
183 | ret->SystemID = xmlDictLookup(dict, SystemID, -1); |
184 | } |
185 | if (content != NULL) { |
186 | ret->length = xmlStrlen(content); |
187 | if ((dict != NULL) && (ret->length < 5)) |
188 | ret->content = (xmlChar *) |
189 | xmlDictLookup(dict, content, ret->length); |
190 | else |
191 | ret->content = xmlStrndup(content, ret->length); |
192 | } else { |
193 | ret->length = 0; |
194 | ret->content = NULL; |
195 | } |
196 | ret->URI = NULL; /* to be computed by the layer knowing |
197 | the defining entity */ |
198 | ret->orig = NULL; |
199 | ret->owner = 0; |
200 | |
201 | return(ret); |
202 | } |
203 | |
204 | /* |
205 | * xmlAddEntity : register a new entity for an entities table. |
206 | */ |
207 | static xmlEntityPtr |
208 | xmlAddEntity(xmlDtdPtr dtd, const xmlChar *name, int type, |
209 | const xmlChar *ExternalID, const xmlChar *SystemID, |
210 | const xmlChar *content) { |
211 | xmlDictPtr dict = NULL; |
212 | xmlEntitiesTablePtr table = NULL; |
213 | xmlEntityPtr ret; |
214 | |
215 | if (name == NULL) |
216 | return(NULL); |
217 | if (dtd == NULL) |
218 | return(NULL); |
219 | if (dtd->doc != NULL) |
220 | dict = dtd->doc->dict; |
221 | |
222 | switch (type) { |
223 | case XML_INTERNAL_GENERAL_ENTITY: |
224 | case XML_EXTERNAL_GENERAL_PARSED_ENTITY: |
225 | case XML_EXTERNAL_GENERAL_UNPARSED_ENTITY: |
226 | if (dtd->entities == NULL) |
227 | dtd->entities = xmlHashCreateDict(0, dict); |
228 | table = dtd->entities; |
229 | break; |
230 | case XML_INTERNAL_PARAMETER_ENTITY: |
231 | case XML_EXTERNAL_PARAMETER_ENTITY: |
232 | if (dtd->pentities == NULL) |
233 | dtd->pentities = xmlHashCreateDict(0, dict); |
234 | table = dtd->pentities; |
235 | break; |
236 | case XML_INTERNAL_PREDEFINED_ENTITY: |
237 | return(NULL); |
238 | } |
239 | if (table == NULL) |
240 | return(NULL); |
241 | ret = xmlCreateEntity(dict, name, type, ExternalID, SystemID, content); |
242 | if (ret == NULL) |
243 | return(NULL); |
244 | ret->doc = dtd->doc; |
245 | |
246 | if (xmlHashAddEntry(table, name, ret)) { |
247 | /* |
248 | * entity was already defined at another level. |
249 | */ |
250 | xmlFreeEntity(ret); |
251 | return(NULL); |
252 | } |
253 | return(ret); |
254 | } |
255 | |
256 | /** |
257 | * xmlGetPredefinedEntity: |
258 | * @name: the entity name |
259 | * |
260 | * Check whether this name is an predefined entity. |
261 | * |
262 | * Returns NULL if not, otherwise the entity |
263 | */ |
264 | xmlEntityPtr |
265 | xmlGetPredefinedEntity(const xmlChar *name) { |
266 | if (name == NULL) return(NULL); |
267 | switch (name[0]) { |
268 | case 'l': |
269 | if (xmlStrEqual(name, BAD_CAST "lt" )) |
270 | return(&xmlEntityLt); |
271 | break; |
272 | case 'g': |
273 | if (xmlStrEqual(name, BAD_CAST "gt" )) |
274 | return(&xmlEntityGt); |
275 | break; |
276 | case 'a': |
277 | if (xmlStrEqual(name, BAD_CAST "amp" )) |
278 | return(&xmlEntityAmp); |
279 | if (xmlStrEqual(name, BAD_CAST "apos" )) |
280 | return(&xmlEntityApos); |
281 | break; |
282 | case 'q': |
283 | if (xmlStrEqual(name, BAD_CAST "quot" )) |
284 | return(&xmlEntityQuot); |
285 | break; |
286 | default: |
287 | break; |
288 | } |
289 | return(NULL); |
290 | } |
291 | |
292 | /** |
293 | * xmlAddDtdEntity: |
294 | * @doc: the document |
295 | * @name: the entity name |
296 | * @type: the entity type XML_xxx_yyy_ENTITY |
297 | * @ExternalID: the entity external ID if available |
298 | * @SystemID: the entity system ID if available |
299 | * @content: the entity content |
300 | * |
301 | * Register a new entity for this document DTD external subset. |
302 | * |
303 | * Returns a pointer to the entity or NULL in case of error |
304 | */ |
305 | xmlEntityPtr |
306 | xmlAddDtdEntity(xmlDocPtr doc, const xmlChar *name, int type, |
307 | const xmlChar *ExternalID, const xmlChar *SystemID, |
308 | const xmlChar *content) { |
309 | xmlEntityPtr ret; |
310 | xmlDtdPtr dtd; |
311 | |
312 | if (doc == NULL) { |
313 | xmlEntitiesErr(XML_DTD_NO_DOC, |
314 | "xmlAddDtdEntity: document is NULL" ); |
315 | return(NULL); |
316 | } |
317 | if (doc->extSubset == NULL) { |
318 | xmlEntitiesErr(XML_DTD_NO_DTD, |
319 | "xmlAddDtdEntity: document without external subset" ); |
320 | return(NULL); |
321 | } |
322 | dtd = doc->extSubset; |
323 | ret = xmlAddEntity(dtd, name, type, ExternalID, SystemID, content); |
324 | if (ret == NULL) return(NULL); |
325 | |
326 | /* |
327 | * Link it to the DTD |
328 | */ |
329 | ret->parent = dtd; |
330 | ret->doc = dtd->doc; |
331 | if (dtd->last == NULL) { |
332 | dtd->children = dtd->last = (xmlNodePtr) ret; |
333 | } else { |
334 | dtd->last->next = (xmlNodePtr) ret; |
335 | ret->prev = dtd->last; |
336 | dtd->last = (xmlNodePtr) ret; |
337 | } |
338 | return(ret); |
339 | } |
340 | |
341 | /** |
342 | * xmlAddDocEntity: |
343 | * @doc: the document |
344 | * @name: the entity name |
345 | * @type: the entity type XML_xxx_yyy_ENTITY |
346 | * @ExternalID: the entity external ID if available |
347 | * @SystemID: the entity system ID if available |
348 | * @content: the entity content |
349 | * |
350 | * Register a new entity for this document. |
351 | * |
352 | * Returns a pointer to the entity or NULL in case of error |
353 | */ |
354 | xmlEntityPtr |
355 | xmlAddDocEntity(xmlDocPtr doc, const xmlChar *name, int type, |
356 | const xmlChar *ExternalID, const xmlChar *SystemID, |
357 | const xmlChar *content) { |
358 | xmlEntityPtr ret; |
359 | xmlDtdPtr dtd; |
360 | |
361 | if (doc == NULL) { |
362 | xmlEntitiesErr(XML_DTD_NO_DOC, |
363 | "xmlAddDocEntity: document is NULL" ); |
364 | return(NULL); |
365 | } |
366 | if (doc->intSubset == NULL) { |
367 | xmlEntitiesErr(XML_DTD_NO_DTD, |
368 | "xmlAddDocEntity: document without internal subset" ); |
369 | return(NULL); |
370 | } |
371 | dtd = doc->intSubset; |
372 | ret = xmlAddEntity(dtd, name, type, ExternalID, SystemID, content); |
373 | if (ret == NULL) return(NULL); |
374 | |
375 | /* |
376 | * Link it to the DTD |
377 | */ |
378 | ret->parent = dtd; |
379 | ret->doc = dtd->doc; |
380 | if (dtd->last == NULL) { |
381 | dtd->children = dtd->last = (xmlNodePtr) ret; |
382 | } else { |
383 | dtd->last->next = (xmlNodePtr) ret; |
384 | ret->prev = dtd->last; |
385 | dtd->last = (xmlNodePtr) ret; |
386 | } |
387 | return(ret); |
388 | } |
389 | |
390 | /** |
391 | * xmlNewEntity: |
392 | * @doc: the document |
393 | * @name: the entity name |
394 | * @type: the entity type XML_xxx_yyy_ENTITY |
395 | * @ExternalID: the entity external ID if available |
396 | * @SystemID: the entity system ID if available |
397 | * @content: the entity content |
398 | * |
399 | * Create a new entity, this differs from xmlAddDocEntity() that if |
400 | * the document is NULL or has no internal subset defined, then an |
401 | * unlinked entity structure will be returned, it is then the responsability |
402 | * of the caller to link it to the document later or free it when not needed |
403 | * anymore. |
404 | * |
405 | * Returns a pointer to the entity or NULL in case of error |
406 | */ |
407 | xmlEntityPtr |
408 | xmlNewEntity(xmlDocPtr doc, const xmlChar *name, int type, |
409 | const xmlChar *ExternalID, const xmlChar *SystemID, |
410 | const xmlChar *content) { |
411 | xmlEntityPtr ret; |
412 | xmlDictPtr dict; |
413 | |
414 | if ((doc != NULL) && (doc->intSubset != NULL)) { |
415 | return(xmlAddDocEntity(doc, name, type, ExternalID, SystemID, content)); |
416 | } |
417 | if (doc != NULL) |
418 | dict = doc->dict; |
419 | else |
420 | dict = NULL; |
421 | ret = xmlCreateEntity(dict, name, type, ExternalID, SystemID, content); |
422 | if (ret == NULL) |
423 | return(NULL); |
424 | ret->doc = doc; |
425 | return(ret); |
426 | } |
427 | |
428 | /** |
429 | * xmlGetEntityFromTable: |
430 | * @table: an entity table |
431 | * @name: the entity name |
432 | * @parameter: look for parameter entities |
433 | * |
434 | * Do an entity lookup in the table. |
435 | * returns the corresponding parameter entity, if found. |
436 | * |
437 | * Returns A pointer to the entity structure or NULL if not found. |
438 | */ |
439 | static xmlEntityPtr |
440 | xmlGetEntityFromTable(xmlEntitiesTablePtr table, const xmlChar *name) { |
441 | return((xmlEntityPtr) xmlHashLookup(table, name)); |
442 | } |
443 | |
444 | /** |
445 | * xmlGetParameterEntity: |
446 | * @doc: the document referencing the entity |
447 | * @name: the entity name |
448 | * |
449 | * Do an entity lookup in the internal and external subsets and |
450 | * returns the corresponding parameter entity, if found. |
451 | * |
452 | * Returns A pointer to the entity structure or NULL if not found. |
453 | */ |
454 | xmlEntityPtr |
455 | xmlGetParameterEntity(xmlDocPtr doc, const xmlChar *name) { |
456 | xmlEntitiesTablePtr table; |
457 | xmlEntityPtr ret; |
458 | |
459 | if (doc == NULL) |
460 | return(NULL); |
461 | if ((doc->intSubset != NULL) && (doc->intSubset->pentities != NULL)) { |
462 | table = (xmlEntitiesTablePtr) doc->intSubset->pentities; |
463 | ret = xmlGetEntityFromTable(table, name); |
464 | if (ret != NULL) |
465 | return(ret); |
466 | } |
467 | if ((doc->extSubset != NULL) && (doc->extSubset->pentities != NULL)) { |
468 | table = (xmlEntitiesTablePtr) doc->extSubset->pentities; |
469 | return(xmlGetEntityFromTable(table, name)); |
470 | } |
471 | return(NULL); |
472 | } |
473 | |
474 | /** |
475 | * xmlGetDtdEntity: |
476 | * @doc: the document referencing the entity |
477 | * @name: the entity name |
478 | * |
479 | * Do an entity lookup in the DTD entity hash table and |
480 | * returns the corresponding entity, if found. |
481 | * Note: the first argument is the document node, not the DTD node. |
482 | * |
483 | * Returns A pointer to the entity structure or NULL if not found. |
484 | */ |
485 | xmlEntityPtr |
486 | xmlGetDtdEntity(xmlDocPtr doc, const xmlChar *name) { |
487 | xmlEntitiesTablePtr table; |
488 | |
489 | if (doc == NULL) |
490 | return(NULL); |
491 | if ((doc->extSubset != NULL) && (doc->extSubset->entities != NULL)) { |
492 | table = (xmlEntitiesTablePtr) doc->extSubset->entities; |
493 | return(xmlGetEntityFromTable(table, name)); |
494 | } |
495 | return(NULL); |
496 | } |
497 | |
498 | /** |
499 | * xmlGetDocEntity: |
500 | * @doc: the document referencing the entity |
501 | * @name: the entity name |
502 | * |
503 | * Do an entity lookup in the document entity hash table and |
504 | * returns the corresponding entity, otherwise a lookup is done |
505 | * in the predefined entities too. |
506 | * |
507 | * Returns A pointer to the entity structure or NULL if not found. |
508 | */ |
509 | xmlEntityPtr |
510 | xmlGetDocEntity(const xmlDoc *doc, const xmlChar *name) { |
511 | xmlEntityPtr cur; |
512 | xmlEntitiesTablePtr table; |
513 | |
514 | if (doc != NULL) { |
515 | if ((doc->intSubset != NULL) && (doc->intSubset->entities != NULL)) { |
516 | table = (xmlEntitiesTablePtr) doc->intSubset->entities; |
517 | cur = xmlGetEntityFromTable(table, name); |
518 | if (cur != NULL) |
519 | return(cur); |
520 | } |
521 | if (doc->standalone != 1) { |
522 | if ((doc->extSubset != NULL) && |
523 | (doc->extSubset->entities != NULL)) { |
524 | table = (xmlEntitiesTablePtr) doc->extSubset->entities; |
525 | cur = xmlGetEntityFromTable(table, name); |
526 | if (cur != NULL) |
527 | return(cur); |
528 | } |
529 | } |
530 | } |
531 | return(xmlGetPredefinedEntity(name)); |
532 | } |
533 | |
534 | /* |
535 | * Macro used to grow the current buffer. |
536 | */ |
537 | #define growBufferReentrant() { \ |
538 | xmlChar *tmp; \ |
539 | size_t new_size = buffer_size * 2; \ |
540 | if (new_size < buffer_size) goto mem_error; \ |
541 | tmp = (xmlChar *) xmlRealloc(buffer, new_size); \ |
542 | if (tmp == NULL) goto mem_error; \ |
543 | buffer = tmp; \ |
544 | buffer_size = new_size; \ |
545 | } |
546 | |
547 | /** |
548 | * xmlEncodeEntitiesInternal: |
549 | * @doc: the document containing the string |
550 | * @input: A string to convert to XML. |
551 | * @attr: are we handling an atrbute value |
552 | * |
553 | * Do a global encoding of a string, replacing the predefined entities |
554 | * and non ASCII values with their entities and CharRef counterparts. |
555 | * Contrary to xmlEncodeEntities, this routine is reentrant, and result |
556 | * must be deallocated. |
557 | * |
558 | * Returns A newly allocated string with the substitution done. |
559 | */ |
560 | static xmlChar * |
561 | xmlEncodeEntitiesInternal(xmlDocPtr doc, const xmlChar *input, int attr) { |
562 | const xmlChar *cur = input; |
563 | xmlChar *buffer = NULL; |
564 | xmlChar *out = NULL; |
565 | size_t buffer_size = 0; |
566 | int html = 0; |
567 | |
568 | if (input == NULL) return(NULL); |
569 | if (doc != NULL) |
570 | html = (doc->type == XML_HTML_DOCUMENT_NODE); |
571 | |
572 | /* |
573 | * allocate an translation buffer. |
574 | */ |
575 | buffer_size = 1000; |
576 | buffer = (xmlChar *) xmlMalloc(buffer_size * sizeof(xmlChar)); |
577 | if (buffer == NULL) { |
578 | xmlEntitiesErrMemory("xmlEncodeEntities: malloc failed" ); |
579 | return(NULL); |
580 | } |
581 | out = buffer; |
582 | |
583 | while (*cur != '\0') { |
584 | size_t indx = out - buffer; |
585 | if (indx + 100 > buffer_size) { |
586 | |
587 | growBufferReentrant(); |
588 | out = &buffer[indx]; |
589 | } |
590 | |
591 | /* |
592 | * By default one have to encode at least '<', '>', '"' and '&' ! |
593 | */ |
594 | if (*cur == '<') { |
595 | const xmlChar *end; |
596 | |
597 | /* |
598 | * Special handling of server side include in HTML attributes |
599 | */ |
600 | if (html && attr && |
601 | (cur[1] == '!') && (cur[2] == '-') && (cur[3] == '-') && |
602 | ((end = xmlStrstr(cur, BAD_CAST "-->" )) != NULL)) { |
603 | while (cur != end) { |
604 | *out++ = *cur++; |
605 | indx = out - buffer; |
606 | if (indx + 100 > buffer_size) { |
607 | growBufferReentrant(); |
608 | out = &buffer[indx]; |
609 | } |
610 | } |
611 | *out++ = *cur++; |
612 | *out++ = *cur++; |
613 | *out++ = *cur++; |
614 | continue; |
615 | } |
616 | *out++ = '&'; |
617 | *out++ = 'l'; |
618 | *out++ = 't'; |
619 | *out++ = ';'; |
620 | } else if (*cur == '>') { |
621 | *out++ = '&'; |
622 | *out++ = 'g'; |
623 | *out++ = 't'; |
624 | *out++ = ';'; |
625 | } else if (*cur == '&') { |
626 | /* |
627 | * Special handling of &{...} construct from HTML 4, see |
628 | * http://www.w3.org/TR/html401/appendix/notes.html#h-B.7.1 |
629 | */ |
630 | if (html && attr && (cur[1] == '{') && |
631 | (strchr((const char *) cur, '}'))) { |
632 | while (*cur != '}') { |
633 | *out++ = *cur++; |
634 | indx = out - buffer; |
635 | if (indx + 100 > buffer_size) { |
636 | growBufferReentrant(); |
637 | out = &buffer[indx]; |
638 | } |
639 | } |
640 | *out++ = *cur++; |
641 | continue; |
642 | } |
643 | *out++ = '&'; |
644 | *out++ = 'a'; |
645 | *out++ = 'm'; |
646 | *out++ = 'p'; |
647 | *out++ = ';'; |
648 | } else if (((*cur >= 0x20) && (*cur < 0x80)) || |
649 | (*cur == '\n') || (*cur == '\t') || ((html) && (*cur == '\r'))) { |
650 | /* |
651 | * default case, just copy ! |
652 | */ |
653 | *out++ = *cur; |
654 | } else if (*cur >= 0x80) { |
655 | if (((doc != NULL) && (doc->encoding != NULL)) || (html)) { |
656 | /* |
657 | * Bjørn Reese <br@sseusa.com> provided the patch |
658 | xmlChar xc; |
659 | xc = (*cur & 0x3F) << 6; |
660 | if (cur[1] != 0) { |
661 | xc += *(++cur) & 0x3F; |
662 | *out++ = xc; |
663 | } else |
664 | */ |
665 | *out++ = *cur; |
666 | } else { |
667 | /* |
668 | * We assume we have UTF-8 input. |
669 | */ |
670 | char buf[11], *ptr; |
671 | int val = 0, l = 1; |
672 | |
673 | if (*cur < 0xC0) { |
674 | xmlEntitiesErr(XML_CHECK_NOT_UTF8, |
675 | "xmlEncodeEntities: input not UTF-8" ); |
676 | if (doc != NULL) |
677 | doc->encoding = xmlStrdup(BAD_CAST "ISO-8859-1" ); |
678 | snprintf(buf, sizeof(buf), "&#%d;" , *cur); |
679 | buf[sizeof(buf) - 1] = 0; |
680 | ptr = buf; |
681 | while (*ptr != 0) *out++ = *ptr++; |
682 | cur++; |
683 | continue; |
684 | } else if (*cur < 0xE0) { |
685 | val = (cur[0]) & 0x1F; |
686 | val <<= 6; |
687 | val |= (cur[1]) & 0x3F; |
688 | l = 2; |
689 | } else if (*cur < 0xF0) { |
690 | val = (cur[0]) & 0x0F; |
691 | val <<= 6; |
692 | val |= (cur[1]) & 0x3F; |
693 | val <<= 6; |
694 | val |= (cur[2]) & 0x3F; |
695 | l = 3; |
696 | } else if (*cur < 0xF8) { |
697 | val = (cur[0]) & 0x07; |
698 | val <<= 6; |
699 | val |= (cur[1]) & 0x3F; |
700 | val <<= 6; |
701 | val |= (cur[2]) & 0x3F; |
702 | val <<= 6; |
703 | val |= (cur[3]) & 0x3F; |
704 | l = 4; |
705 | } |
706 | if ((l == 1) || (!IS_CHAR(val))) { |
707 | xmlEntitiesErr(XML_ERR_INVALID_CHAR, |
708 | "xmlEncodeEntities: char out of range\n" ); |
709 | if (doc != NULL) |
710 | doc->encoding = xmlStrdup(BAD_CAST "ISO-8859-1" ); |
711 | snprintf(buf, sizeof(buf), "&#%d;" , *cur); |
712 | buf[sizeof(buf) - 1] = 0; |
713 | ptr = buf; |
714 | while (*ptr != 0) *out++ = *ptr++; |
715 | cur++; |
716 | continue; |
717 | } |
718 | /* |
719 | * We could do multiple things here. Just save as a char ref |
720 | */ |
721 | snprintf(buf, sizeof(buf), "&#x%X;" , val); |
722 | buf[sizeof(buf) - 1] = 0; |
723 | ptr = buf; |
724 | while (*ptr != 0) *out++ = *ptr++; |
725 | cur += l; |
726 | continue; |
727 | } |
728 | } else if (IS_BYTE_CHAR(*cur)) { |
729 | char buf[11], *ptr; |
730 | |
731 | snprintf(buf, sizeof(buf), "&#%d;" , *cur); |
732 | buf[sizeof(buf) - 1] = 0; |
733 | ptr = buf; |
734 | while (*ptr != 0) *out++ = *ptr++; |
735 | } |
736 | cur++; |
737 | } |
738 | *out = 0; |
739 | return(buffer); |
740 | |
741 | mem_error: |
742 | xmlEntitiesErrMemory("xmlEncodeEntities: realloc failed" ); |
743 | xmlFree(buffer); |
744 | return(NULL); |
745 | } |
746 | |
747 | /** |
748 | * xmlEncodeAttributeEntities: |
749 | * @doc: the document containing the string |
750 | * @input: A string to convert to XML. |
751 | * |
752 | * Do a global encoding of a string, replacing the predefined entities |
753 | * and non ASCII values with their entities and CharRef counterparts for |
754 | * attribute values. |
755 | * |
756 | * Returns A newly allocated string with the substitution done. |
757 | */ |
758 | xmlChar * |
759 | xmlEncodeAttributeEntities(xmlDocPtr doc, const xmlChar *input) { |
760 | return xmlEncodeEntitiesInternal(doc, input, 1); |
761 | } |
762 | |
763 | /** |
764 | * xmlEncodeEntitiesReentrant: |
765 | * @doc: the document containing the string |
766 | * @input: A string to convert to XML. |
767 | * |
768 | * Do a global encoding of a string, replacing the predefined entities |
769 | * and non ASCII values with their entities and CharRef counterparts. |
770 | * Contrary to xmlEncodeEntities, this routine is reentrant, and result |
771 | * must be deallocated. |
772 | * |
773 | * Returns A newly allocated string with the substitution done. |
774 | */ |
775 | xmlChar * |
776 | xmlEncodeEntitiesReentrant(xmlDocPtr doc, const xmlChar *input) { |
777 | return xmlEncodeEntitiesInternal(doc, input, 0); |
778 | } |
779 | |
780 | /** |
781 | * xmlEncodeSpecialChars: |
782 | * @doc: the document containing the string |
783 | * @input: A string to convert to XML. |
784 | * |
785 | * Do a global encoding of a string, replacing the predefined entities |
786 | * this routine is reentrant, and result must be deallocated. |
787 | * |
788 | * Returns A newly allocated string with the substitution done. |
789 | */ |
790 | xmlChar * |
791 | xmlEncodeSpecialChars(const xmlDoc *doc ATTRIBUTE_UNUSED, const xmlChar *input) { |
792 | const xmlChar *cur = input; |
793 | xmlChar *buffer = NULL; |
794 | xmlChar *out = NULL; |
795 | size_t buffer_size = 0; |
796 | if (input == NULL) return(NULL); |
797 | |
798 | /* |
799 | * allocate an translation buffer. |
800 | */ |
801 | buffer_size = 1000; |
802 | buffer = (xmlChar *) xmlMalloc(buffer_size * sizeof(xmlChar)); |
803 | if (buffer == NULL) { |
804 | xmlEntitiesErrMemory("xmlEncodeSpecialChars: malloc failed" ); |
805 | return(NULL); |
806 | } |
807 | out = buffer; |
808 | |
809 | while (*cur != '\0') { |
810 | size_t indx = out - buffer; |
811 | if (indx + 10 > buffer_size) { |
812 | |
813 | growBufferReentrant(); |
814 | out = &buffer[indx]; |
815 | } |
816 | |
817 | /* |
818 | * By default one have to encode at least '<', '>', '"' and '&' ! |
819 | */ |
820 | if (*cur == '<') { |
821 | *out++ = '&'; |
822 | *out++ = 'l'; |
823 | *out++ = 't'; |
824 | *out++ = ';'; |
825 | } else if (*cur == '>') { |
826 | *out++ = '&'; |
827 | *out++ = 'g'; |
828 | *out++ = 't'; |
829 | *out++ = ';'; |
830 | } else if (*cur == '&') { |
831 | *out++ = '&'; |
832 | *out++ = 'a'; |
833 | *out++ = 'm'; |
834 | *out++ = 'p'; |
835 | *out++ = ';'; |
836 | } else if (*cur == '"') { |
837 | *out++ = '&'; |
838 | *out++ = 'q'; |
839 | *out++ = 'u'; |
840 | *out++ = 'o'; |
841 | *out++ = 't'; |
842 | *out++ = ';'; |
843 | } else if (*cur == '\r') { |
844 | *out++ = '&'; |
845 | *out++ = '#'; |
846 | *out++ = '1'; |
847 | *out++ = '3'; |
848 | *out++ = ';'; |
849 | } else { |
850 | /* |
851 | * Works because on UTF-8, all extended sequences cannot |
852 | * result in bytes in the ASCII range. |
853 | */ |
854 | *out++ = *cur; |
855 | } |
856 | cur++; |
857 | } |
858 | *out = 0; |
859 | return(buffer); |
860 | |
861 | mem_error: |
862 | xmlEntitiesErrMemory("xmlEncodeSpecialChars: realloc failed" ); |
863 | xmlFree(buffer); |
864 | return(NULL); |
865 | } |
866 | |
867 | /** |
868 | * xmlCreateEntitiesTable: |
869 | * |
870 | * create and initialize an empty entities hash table. |
871 | * This really doesn't make sense and should be deprecated |
872 | * |
873 | * Returns the xmlEntitiesTablePtr just created or NULL in case of error. |
874 | */ |
875 | xmlEntitiesTablePtr |
876 | xmlCreateEntitiesTable(void) { |
877 | return((xmlEntitiesTablePtr) xmlHashCreate(0)); |
878 | } |
879 | |
880 | /** |
881 | * xmlFreeEntityWrapper: |
882 | * @entity: An entity |
883 | * @name: its name |
884 | * |
885 | * Deallocate the memory used by an entities in the hash table. |
886 | */ |
887 | static void |
888 | xmlFreeEntityWrapper(void *entity, const xmlChar *name ATTRIBUTE_UNUSED) { |
889 | if (entity != NULL) |
890 | xmlFreeEntity((xmlEntityPtr) entity); |
891 | } |
892 | |
893 | /** |
894 | * xmlFreeEntitiesTable: |
895 | * @table: An entity table |
896 | * |
897 | * Deallocate the memory used by an entities hash table. |
898 | */ |
899 | void |
900 | xmlFreeEntitiesTable(xmlEntitiesTablePtr table) { |
901 | xmlHashFree(table, xmlFreeEntityWrapper); |
902 | } |
903 | |
904 | #ifdef LIBXML_TREE_ENABLED |
905 | /** |
906 | * xmlCopyEntity: |
907 | * @ent: An entity |
908 | * |
909 | * Build a copy of an entity |
910 | * |
911 | * Returns the new xmlEntitiesPtr or NULL in case of error. |
912 | */ |
913 | static void * |
914 | xmlCopyEntity(void *payload, const xmlChar *name ATTRIBUTE_UNUSED) { |
915 | xmlEntityPtr ent = (xmlEntityPtr) payload; |
916 | xmlEntityPtr cur; |
917 | |
918 | cur = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity)); |
919 | if (cur == NULL) { |
920 | xmlEntitiesErrMemory("xmlCopyEntity:: malloc failed" ); |
921 | return(NULL); |
922 | } |
923 | memset(cur, 0, sizeof(xmlEntity)); |
924 | cur->type = XML_ENTITY_DECL; |
925 | |
926 | cur->etype = ent->etype; |
927 | if (ent->name != NULL) |
928 | cur->name = xmlStrdup(ent->name); |
929 | if (ent->ExternalID != NULL) |
930 | cur->ExternalID = xmlStrdup(ent->ExternalID); |
931 | if (ent->SystemID != NULL) |
932 | cur->SystemID = xmlStrdup(ent->SystemID); |
933 | if (ent->content != NULL) |
934 | cur->content = xmlStrdup(ent->content); |
935 | if (ent->orig != NULL) |
936 | cur->orig = xmlStrdup(ent->orig); |
937 | if (ent->URI != NULL) |
938 | cur->URI = xmlStrdup(ent->URI); |
939 | return(cur); |
940 | } |
941 | |
942 | /** |
943 | * xmlCopyEntitiesTable: |
944 | * @table: An entity table |
945 | * |
946 | * Build a copy of an entity table. |
947 | * |
948 | * Returns the new xmlEntitiesTablePtr or NULL in case of error. |
949 | */ |
950 | xmlEntitiesTablePtr |
951 | xmlCopyEntitiesTable(xmlEntitiesTablePtr table) { |
952 | return(xmlHashCopy(table, xmlCopyEntity)); |
953 | } |
954 | #endif /* LIBXML_TREE_ENABLED */ |
955 | |
956 | #ifdef LIBXML_OUTPUT_ENABLED |
957 | |
958 | /** |
959 | * xmlDumpEntityContent: |
960 | * @buf: An XML buffer. |
961 | * @content: The entity content. |
962 | * |
963 | * This will dump the quoted string value, taking care of the special |
964 | * treatment required by % |
965 | */ |
966 | static void |
967 | xmlDumpEntityContent(xmlBufferPtr buf, const xmlChar *content) { |
968 | if (buf->alloc == XML_BUFFER_ALLOC_IMMUTABLE) return; |
969 | if (xmlStrchr(content, '%')) { |
970 | const xmlChar * base, *cur; |
971 | |
972 | xmlBufferCCat(buf, "\"" ); |
973 | base = cur = content; |
974 | while (*cur != 0) { |
975 | if (*cur == '"') { |
976 | if (base != cur) |
977 | xmlBufferAdd(buf, base, cur - base); |
978 | xmlBufferAdd(buf, BAD_CAST """ , 6); |
979 | cur++; |
980 | base = cur; |
981 | } else if (*cur == '%') { |
982 | if (base != cur) |
983 | xmlBufferAdd(buf, base, cur - base); |
984 | xmlBufferAdd(buf, BAD_CAST "%" , 6); |
985 | cur++; |
986 | base = cur; |
987 | } else { |
988 | cur++; |
989 | } |
990 | } |
991 | if (base != cur) |
992 | xmlBufferAdd(buf, base, cur - base); |
993 | xmlBufferCCat(buf, "\"" ); |
994 | } else { |
995 | xmlBufferWriteQuotedString(buf, content); |
996 | } |
997 | } |
998 | |
999 | /** |
1000 | * xmlDumpEntityDecl: |
1001 | * @buf: An XML buffer. |
1002 | * @ent: An entity table |
1003 | * |
1004 | * This will dump the content of the entity table as an XML DTD definition |
1005 | */ |
1006 | void |
1007 | xmlDumpEntityDecl(xmlBufferPtr buf, xmlEntityPtr ent) { |
1008 | if ((buf == NULL) || (ent == NULL)) return; |
1009 | switch (ent->etype) { |
1010 | case XML_INTERNAL_GENERAL_ENTITY: |
1011 | xmlBufferWriteChar(buf, "<!ENTITY " ); |
1012 | xmlBufferWriteCHAR(buf, ent->name); |
1013 | xmlBufferWriteChar(buf, " " ); |
1014 | if (ent->orig != NULL) |
1015 | xmlBufferWriteQuotedString(buf, ent->orig); |
1016 | else |
1017 | xmlDumpEntityContent(buf, ent->content); |
1018 | xmlBufferWriteChar(buf, ">\n" ); |
1019 | break; |
1020 | case XML_EXTERNAL_GENERAL_PARSED_ENTITY: |
1021 | xmlBufferWriteChar(buf, "<!ENTITY " ); |
1022 | xmlBufferWriteCHAR(buf, ent->name); |
1023 | if (ent->ExternalID != NULL) { |
1024 | xmlBufferWriteChar(buf, " PUBLIC " ); |
1025 | xmlBufferWriteQuotedString(buf, ent->ExternalID); |
1026 | xmlBufferWriteChar(buf, " " ); |
1027 | xmlBufferWriteQuotedString(buf, ent->SystemID); |
1028 | } else { |
1029 | xmlBufferWriteChar(buf, " SYSTEM " ); |
1030 | xmlBufferWriteQuotedString(buf, ent->SystemID); |
1031 | } |
1032 | xmlBufferWriteChar(buf, ">\n" ); |
1033 | break; |
1034 | case XML_EXTERNAL_GENERAL_UNPARSED_ENTITY: |
1035 | xmlBufferWriteChar(buf, "<!ENTITY " ); |
1036 | xmlBufferWriteCHAR(buf, ent->name); |
1037 | if (ent->ExternalID != NULL) { |
1038 | xmlBufferWriteChar(buf, " PUBLIC " ); |
1039 | xmlBufferWriteQuotedString(buf, ent->ExternalID); |
1040 | xmlBufferWriteChar(buf, " " ); |
1041 | xmlBufferWriteQuotedString(buf, ent->SystemID); |
1042 | } else { |
1043 | xmlBufferWriteChar(buf, " SYSTEM " ); |
1044 | xmlBufferWriteQuotedString(buf, ent->SystemID); |
1045 | } |
1046 | if (ent->content != NULL) { /* Should be true ! */ |
1047 | xmlBufferWriteChar(buf, " NDATA " ); |
1048 | if (ent->orig != NULL) |
1049 | xmlBufferWriteCHAR(buf, ent->orig); |
1050 | else |
1051 | xmlBufferWriteCHAR(buf, ent->content); |
1052 | } |
1053 | xmlBufferWriteChar(buf, ">\n" ); |
1054 | break; |
1055 | case XML_INTERNAL_PARAMETER_ENTITY: |
1056 | xmlBufferWriteChar(buf, "<!ENTITY % " ); |
1057 | xmlBufferWriteCHAR(buf, ent->name); |
1058 | xmlBufferWriteChar(buf, " " ); |
1059 | if (ent->orig == NULL) |
1060 | xmlDumpEntityContent(buf, ent->content); |
1061 | else |
1062 | xmlBufferWriteQuotedString(buf, ent->orig); |
1063 | xmlBufferWriteChar(buf, ">\n" ); |
1064 | break; |
1065 | case XML_EXTERNAL_PARAMETER_ENTITY: |
1066 | xmlBufferWriteChar(buf, "<!ENTITY % " ); |
1067 | xmlBufferWriteCHAR(buf, ent->name); |
1068 | if (ent->ExternalID != NULL) { |
1069 | xmlBufferWriteChar(buf, " PUBLIC " ); |
1070 | xmlBufferWriteQuotedString(buf, ent->ExternalID); |
1071 | xmlBufferWriteChar(buf, " " ); |
1072 | xmlBufferWriteQuotedString(buf, ent->SystemID); |
1073 | } else { |
1074 | xmlBufferWriteChar(buf, " SYSTEM " ); |
1075 | xmlBufferWriteQuotedString(buf, ent->SystemID); |
1076 | } |
1077 | xmlBufferWriteChar(buf, ">\n" ); |
1078 | break; |
1079 | default: |
1080 | xmlEntitiesErr(XML_DTD_UNKNOWN_ENTITY, |
1081 | "xmlDumpEntitiesDecl: internal: unknown type entity type" ); |
1082 | } |
1083 | } |
1084 | |
1085 | /** |
1086 | * xmlDumpEntityDeclScan: |
1087 | * @ent: An entity table |
1088 | * @buf: An XML buffer. |
1089 | * |
1090 | * When using the hash table scan function, arguments need to be reversed |
1091 | */ |
1092 | static void |
1093 | xmlDumpEntityDeclScan(void *ent, void *buf, |
1094 | const xmlChar *name ATTRIBUTE_UNUSED) { |
1095 | xmlDumpEntityDecl((xmlBufferPtr) buf, (xmlEntityPtr) ent); |
1096 | } |
1097 | |
1098 | /** |
1099 | * xmlDumpEntitiesTable: |
1100 | * @buf: An XML buffer. |
1101 | * @table: An entity table |
1102 | * |
1103 | * This will dump the content of the entity table as an XML DTD definition |
1104 | */ |
1105 | void |
1106 | xmlDumpEntitiesTable(xmlBufferPtr buf, xmlEntitiesTablePtr table) { |
1107 | xmlHashScan(table, xmlDumpEntityDeclScan, buf); |
1108 | } |
1109 | #endif /* LIBXML_OUTPUT_ENABLED */ |
1110 | #define bottom_entities |
1111 | #include "elfgcchack.h" |
1112 | |