1 /* libxml2 - Library for parsing XML documents
2 * Copyright (C) 2006-2019 Free Software Foundation, Inc.
3 *
4 * This file is not part of the GNU gettext program, but is used with
5 * GNU gettext.
6 *
7 * The original copyright notice is as follows:
8 */
9
10 /*
11 * Copyright (C) 1998-2012 Daniel Veillard. All Rights Reserved.
12 *
13 * Permission is hereby granted, free of charge, to any person obtaining a copy
14 * of this software and associated documentation files (the "Software"), to deal
15 * in the Software without restriction, including without limitation the rights
16 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
17 * copies of the Software, and to permit persons to whom the Software is fur-
18 * nished to do so, subject to the following conditions:
19 *
20 * The above copyright notice and this permission notice shall be included in
21 * all copies or substantial portions of the Software.
22 *
23 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
24 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FIT-
25 * NESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
26 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
27 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
28 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
29 * THE SOFTWARE.
30 *
31 * daniel@veillard.com
32 */
33
34 /*
35 * entities.c : implementation for the XML entities handling
36 */
37
38 /* To avoid EBCDIC trouble when parsing on zOS */
39 #if defined(__MVS__)
40 #pragma convert("ISO8859-1")
41 #endif
42
43 #define IN_LIBXML
44 #include "libxml.h"
45
46 #include <string.h>
47 #ifdef HAVE_STDLIB_H
48 #include <stdlib.h>
49 #endif
50 #include <libxml/xmlmemory.h>
51 #include <libxml/hash.h>
52 #include <libxml/entities.h>
53 #include <libxml/parser.h>
54 #include <libxml/parserInternals.h>
55 #include <libxml/xmlerror.h>
56 #include <libxml/globals.h>
57 #include <libxml/dict.h>
58
59 #include "save.h"
60
61 /*
62 * The XML predefined entities.
63 */
64
65 static xmlEntity xmlEntityLt = {
66 NULL, XML_ENTITY_DECL, BAD_CAST "lt",
67 NULL, NULL, NULL, NULL, NULL, NULL,
68 BAD_CAST "<", BAD_CAST "<", 1,
69 XML_INTERNAL_PREDEFINED_ENTITY,
70 NULL, NULL, NULL, NULL, 0, 1
71 };
72 static xmlEntity xmlEntityGt = {
73 NULL, XML_ENTITY_DECL, BAD_CAST "gt",
74 NULL, NULL, NULL, NULL, NULL, NULL,
75 BAD_CAST ">", BAD_CAST ">", 1,
76 XML_INTERNAL_PREDEFINED_ENTITY,
77 NULL, NULL, NULL, NULL, 0, 1
78 };
79 static xmlEntity xmlEntityAmp = {
80 NULL, XML_ENTITY_DECL, BAD_CAST "amp",
81 NULL, NULL, NULL, NULL, NULL, NULL,
82 BAD_CAST "&", BAD_CAST "&", 1,
83 XML_INTERNAL_PREDEFINED_ENTITY,
84 NULL, NULL, NULL, NULL, 0, 1
85 };
86 static xmlEntity xmlEntityQuot = {
87 NULL, XML_ENTITY_DECL, BAD_CAST "quot",
88 NULL, NULL, NULL, NULL, NULL, NULL,
89 BAD_CAST "\"", BAD_CAST "\"", 1,
90 XML_INTERNAL_PREDEFINED_ENTITY,
91 NULL, NULL, NULL, NULL, 0, 1
92 };
93 static xmlEntity xmlEntityApos = {
94 NULL, XML_ENTITY_DECL, BAD_CAST "apos",
95 NULL, NULL, NULL, NULL, NULL, NULL,
96 BAD_CAST "'", BAD_CAST "'", 1,
97 XML_INTERNAL_PREDEFINED_ENTITY,
98 NULL, NULL, NULL, NULL, 0, 1
99 };
100
101 /**
102 * xmlEntitiesErrMemory:
103 * @extra: extra informations
104 *
105 * Handle an out of memory condition
106 */
107 static void
xmlEntitiesErrMemory(const char * extra)108 xmlEntitiesErrMemory(const char *extra)
109 {
110 __xmlSimpleError(XML_FROM_TREE, XML_ERR_NO_MEMORY, NULL, NULL, extra);
111 }
112
113 /**
114 * xmlEntitiesErr:
115 * @code: the error code
116 * @msg: the message
117 *
118 * Handle an out of memory condition
119 */
120 static void LIBXML_ATTR_FORMAT(2,0)
xmlEntitiesErr(xmlParserErrors code,const char * msg)121 xmlEntitiesErr(xmlParserErrors code, const char *msg)
122 {
123 __xmlSimpleError(XML_FROM_TREE, code, NULL, msg, NULL);
124 }
125
126 /*
127 * xmlFreeEntity : clean-up an entity record.
128 */
129 static void
xmlFreeEntity(xmlEntityPtr entity)130 xmlFreeEntity(xmlEntityPtr entity)
131 {
132 xmlDictPtr dict = NULL;
133
134 if (entity == NULL)
135 return;
136
137 if (entity->doc != NULL)
138 dict = entity->doc->dict;
139
140
141 if ((entity->children) && (entity->owner == 1) &&
142 (entity == (xmlEntityPtr) entity->children->parent))
143 xmlFreeNodeList(entity->children);
144 if (dict != NULL) {
145 if ((entity->name != NULL) && (!xmlDictOwns(dict, entity->name)))
146 xmlFree((char *) entity->name);
147 if ((entity->ExternalID != NULL) &&
148 (!xmlDictOwns(dict, entity->ExternalID)))
149 xmlFree((char *) entity->ExternalID);
150 if ((entity->SystemID != NULL) &&
151 (!xmlDictOwns(dict, entity->SystemID)))
152 xmlFree((char *) entity->SystemID);
153 if ((entity->URI != NULL) && (!xmlDictOwns(dict, entity->URI)))
154 xmlFree((char *) entity->URI);
155 if ((entity->content != NULL)
156 && (!xmlDictOwns(dict, entity->content)))
157 xmlFree((char *) entity->content);
158 if ((entity->orig != NULL) && (!xmlDictOwns(dict, entity->orig)))
159 xmlFree((char *) entity->orig);
160 } else {
161 if (entity->name != NULL)
162 xmlFree((char *) entity->name);
163 if (entity->ExternalID != NULL)
164 xmlFree((char *) entity->ExternalID);
165 if (entity->SystemID != NULL)
166 xmlFree((char *) entity->SystemID);
167 if (entity->URI != NULL)
168 xmlFree((char *) entity->URI);
169 if (entity->content != NULL)
170 xmlFree((char *) entity->content);
171 if (entity->orig != NULL)
172 xmlFree((char *) entity->orig);
173 }
174 xmlFree(entity);
175 }
176
177 /*
178 * xmlCreateEntity:
179 *
180 * internal routine doing the entity node strutures allocations
181 */
182 static xmlEntityPtr
xmlCreateEntity(xmlDictPtr dict,const xmlChar * name,int type,const xmlChar * ExternalID,const xmlChar * SystemID,const xmlChar * content)183 xmlCreateEntity(xmlDictPtr dict, const xmlChar *name, int type,
184 const xmlChar *ExternalID, const xmlChar *SystemID,
185 const xmlChar *content) {
186 xmlEntityPtr ret;
187
188 ret = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
189 if (ret == NULL) {
190 xmlEntitiesErrMemory("xmlCreateEntity: malloc failed");
191 return(NULL);
192 }
193 memset(ret, 0, sizeof(xmlEntity));
194 ret->type = XML_ENTITY_DECL;
195 ret->checked = 0;
196
197 /*
198 * fill the structure.
199 */
200 ret->etype = (xmlEntityType) type;
201 if (dict == NULL) {
202 ret->name = xmlStrdup(name);
203 if (ExternalID != NULL)
204 ret->ExternalID = xmlStrdup(ExternalID);
205 if (SystemID != NULL)
206 ret->SystemID = xmlStrdup(SystemID);
207 } else {
208 ret->name = xmlDictLookup(dict, name, -1);
209 if (ExternalID != NULL)
210 ret->ExternalID = xmlDictLookup(dict, ExternalID, -1);
211 if (SystemID != NULL)
212 ret->SystemID = xmlDictLookup(dict, SystemID, -1);
213 }
214 if (content != NULL) {
215 ret->length = xmlStrlen(content);
216 if ((dict != NULL) && (ret->length < 5))
217 ret->content = (xmlChar *)
218 xmlDictLookup(dict, content, ret->length);
219 else
220 ret->content = xmlStrndup(content, ret->length);
221 } else {
222 ret->length = 0;
223 ret->content = NULL;
224 }
225 ret->URI = NULL; /* to be computed by the layer knowing
226 the defining entity */
227 ret->orig = NULL;
228 ret->owner = 0;
229
230 return(ret);
231 }
232
233 /*
234 * xmlAddEntity : register a new entity for an entities table.
235 */
236 static xmlEntityPtr
xmlAddEntity(xmlDtdPtr dtd,const xmlChar * name,int type,const xmlChar * ExternalID,const xmlChar * SystemID,const xmlChar * content)237 xmlAddEntity(xmlDtdPtr dtd, const xmlChar *name, int type,
238 const xmlChar *ExternalID, const xmlChar *SystemID,
239 const xmlChar *content) {
240 xmlDictPtr dict = NULL;
241 xmlEntitiesTablePtr table = NULL;
242 xmlEntityPtr ret;
243
244 if (name == NULL)
245 return(NULL);
246 if (dtd == NULL)
247 return(NULL);
248 if (dtd->doc != NULL)
249 dict = dtd->doc->dict;
250
251 switch (type) {
252 case XML_INTERNAL_GENERAL_ENTITY:
253 case XML_EXTERNAL_GENERAL_PARSED_ENTITY:
254 case XML_EXTERNAL_GENERAL_UNPARSED_ENTITY:
255 if (dtd->entities == NULL)
256 dtd->entities = xmlHashCreateDict(0, dict);
257 table = dtd->entities;
258 break;
259 case XML_INTERNAL_PARAMETER_ENTITY:
260 case XML_EXTERNAL_PARAMETER_ENTITY:
261 if (dtd->pentities == NULL)
262 dtd->pentities = xmlHashCreateDict(0, dict);
263 table = dtd->pentities;
264 break;
265 case XML_INTERNAL_PREDEFINED_ENTITY:
266 return(NULL);
267 }
268 if (table == NULL)
269 return(NULL);
270 ret = xmlCreateEntity(dict, name, type, ExternalID, SystemID, content);
271 if (ret == NULL)
272 return(NULL);
273 ret->doc = dtd->doc;
274
275 if (xmlHashAddEntry(table, name, ret)) {
276 /*
277 * entity was already defined at another level.
278 */
279 xmlFreeEntity(ret);
280 return(NULL);
281 }
282 return(ret);
283 }
284
285 /**
286 * xmlGetPredefinedEntity:
287 * @name: the entity name
288 *
289 * Check whether this name is an predefined entity.
290 *
291 * Returns NULL if not, otherwise the entity
292 */
293 xmlEntityPtr
xmlGetPredefinedEntity(const xmlChar * name)294 xmlGetPredefinedEntity(const xmlChar *name) {
295 if (name == NULL) return(NULL);
296 switch (name[0]) {
297 case 'l':
298 if (xmlStrEqual(name, BAD_CAST "lt"))
299 return(&xmlEntityLt);
300 break;
301 case 'g':
302 if (xmlStrEqual(name, BAD_CAST "gt"))
303 return(&xmlEntityGt);
304 break;
305 case 'a':
306 if (xmlStrEqual(name, BAD_CAST "amp"))
307 return(&xmlEntityAmp);
308 if (xmlStrEqual(name, BAD_CAST "apos"))
309 return(&xmlEntityApos);
310 break;
311 case 'q':
312 if (xmlStrEqual(name, BAD_CAST "quot"))
313 return(&xmlEntityQuot);
314 break;
315 default:
316 break;
317 }
318 return(NULL);
319 }
320
321 /**
322 * xmlAddDtdEntity:
323 * @doc: the document
324 * @name: the entity name
325 * @type: the entity type XML_xxx_yyy_ENTITY
326 * @ExternalID: the entity external ID if available
327 * @SystemID: the entity system ID if available
328 * @content: the entity content
329 *
330 * Register a new entity for this document DTD external subset.
331 *
332 * Returns a pointer to the entity or NULL in case of error
333 */
334 xmlEntityPtr
xmlAddDtdEntity(xmlDocPtr doc,const xmlChar * name,int type,const xmlChar * ExternalID,const xmlChar * SystemID,const xmlChar * content)335 xmlAddDtdEntity(xmlDocPtr doc, const xmlChar *name, int type,
336 const xmlChar *ExternalID, const xmlChar *SystemID,
337 const xmlChar *content) {
338 xmlEntityPtr ret;
339 xmlDtdPtr dtd;
340
341 if (doc == NULL) {
342 xmlEntitiesErr(XML_DTD_NO_DOC,
343 "xmlAddDtdEntity: document is NULL");
344 return(NULL);
345 }
346 if (doc->extSubset == NULL) {
347 xmlEntitiesErr(XML_DTD_NO_DTD,
348 "xmlAddDtdEntity: document without external subset");
349 return(NULL);
350 }
351 dtd = doc->extSubset;
352 ret = xmlAddEntity(dtd, name, type, ExternalID, SystemID, content);
353 if (ret == NULL) return(NULL);
354
355 /*
356 * Link it to the DTD
357 */
358 ret->parent = dtd;
359 ret->doc = dtd->doc;
360 if (dtd->last == NULL) {
361 dtd->children = dtd->last = (xmlNodePtr) ret;
362 } else {
363 dtd->last->next = (xmlNodePtr) ret;
364 ret->prev = dtd->last;
365 dtd->last = (xmlNodePtr) ret;
366 }
367 return(ret);
368 }
369
370 /**
371 * xmlAddDocEntity:
372 * @doc: the document
373 * @name: the entity name
374 * @type: the entity type XML_xxx_yyy_ENTITY
375 * @ExternalID: the entity external ID if available
376 * @SystemID: the entity system ID if available
377 * @content: the entity content
378 *
379 * Register a new entity for this document.
380 *
381 * Returns a pointer to the entity or NULL in case of error
382 */
383 xmlEntityPtr
xmlAddDocEntity(xmlDocPtr doc,const xmlChar * name,int type,const xmlChar * ExternalID,const xmlChar * SystemID,const xmlChar * content)384 xmlAddDocEntity(xmlDocPtr doc, const xmlChar *name, int type,
385 const xmlChar *ExternalID, const xmlChar *SystemID,
386 const xmlChar *content) {
387 xmlEntityPtr ret;
388 xmlDtdPtr dtd;
389
390 if (doc == NULL) {
391 xmlEntitiesErr(XML_DTD_NO_DOC,
392 "xmlAddDocEntity: document is NULL");
393 return(NULL);
394 }
395 if (doc->intSubset == NULL) {
396 xmlEntitiesErr(XML_DTD_NO_DTD,
397 "xmlAddDocEntity: document without internal subset");
398 return(NULL);
399 }
400 dtd = doc->intSubset;
401 ret = xmlAddEntity(dtd, name, type, ExternalID, SystemID, content);
402 if (ret == NULL) return(NULL);
403
404 /*
405 * Link it to the DTD
406 */
407 ret->parent = dtd;
408 ret->doc = dtd->doc;
409 if (dtd->last == NULL) {
410 dtd->children = dtd->last = (xmlNodePtr) ret;
411 } else {
412 dtd->last->next = (xmlNodePtr) ret;
413 ret->prev = dtd->last;
414 dtd->last = (xmlNodePtr) ret;
415 }
416 return(ret);
417 }
418
419 /**
420 * xmlNewEntity:
421 * @doc: the document
422 * @name: the entity name
423 * @type: the entity type XML_xxx_yyy_ENTITY
424 * @ExternalID: the entity external ID if available
425 * @SystemID: the entity system ID if available
426 * @content: the entity content
427 *
428 * Create a new entity, this differs from xmlAddDocEntity() that if
429 * the document is NULL or has no internal subset defined, then an
430 * unlinked entity structure will be returned, it is then the responsability
431 * of the caller to link it to the document later or free it when not needed
432 * anymore.
433 *
434 * Returns a pointer to the entity or NULL in case of error
435 */
436 xmlEntityPtr
xmlNewEntity(xmlDocPtr doc,const xmlChar * name,int type,const xmlChar * ExternalID,const xmlChar * SystemID,const xmlChar * content)437 xmlNewEntity(xmlDocPtr doc, const xmlChar *name, int type,
438 const xmlChar *ExternalID, const xmlChar *SystemID,
439 const xmlChar *content) {
440 xmlEntityPtr ret;
441 xmlDictPtr dict;
442
443 if ((doc != NULL) && (doc->intSubset != NULL)) {
444 return(xmlAddDocEntity(doc, name, type, ExternalID, SystemID, content));
445 }
446 if (doc != NULL)
447 dict = doc->dict;
448 else
449 dict = NULL;
450 ret = xmlCreateEntity(dict, name, type, ExternalID, SystemID, content);
451 if (ret == NULL)
452 return(NULL);
453 ret->doc = doc;
454 return(ret);
455 }
456
457 /**
458 * xmlGetEntityFromTable:
459 * @table: an entity table
460 * @name: the entity name
461 * @parameter: look for parameter entities
462 *
463 * Do an entity lookup in the table.
464 * returns the corresponding parameter entity, if found.
465 *
466 * Returns A pointer to the entity structure or NULL if not found.
467 */
468 static xmlEntityPtr
xmlGetEntityFromTable(xmlEntitiesTablePtr table,const xmlChar * name)469 xmlGetEntityFromTable(xmlEntitiesTablePtr table, const xmlChar *name) {
470 return((xmlEntityPtr) xmlHashLookup(table, name));
471 }
472
473 /**
474 * xmlGetParameterEntity:
475 * @doc: the document referencing the entity
476 * @name: the entity name
477 *
478 * Do an entity lookup in the internal and external subsets and
479 * returns the corresponding parameter entity, if found.
480 *
481 * Returns A pointer to the entity structure or NULL if not found.
482 */
483 xmlEntityPtr
xmlGetParameterEntity(xmlDocPtr doc,const xmlChar * name)484 xmlGetParameterEntity(xmlDocPtr doc, const xmlChar *name) {
485 xmlEntitiesTablePtr table;
486 xmlEntityPtr ret;
487
488 if (doc == NULL)
489 return(NULL);
490 if ((doc->intSubset != NULL) && (doc->intSubset->pentities != NULL)) {
491 table = (xmlEntitiesTablePtr) doc->intSubset->pentities;
492 ret = xmlGetEntityFromTable(table, name);
493 if (ret != NULL)
494 return(ret);
495 }
496 if ((doc->extSubset != NULL) && (doc->extSubset->pentities != NULL)) {
497 table = (xmlEntitiesTablePtr) doc->extSubset->pentities;
498 return(xmlGetEntityFromTable(table, name));
499 }
500 return(NULL);
501 }
502
503 /**
504 * xmlGetDtdEntity:
505 * @doc: the document referencing the entity
506 * @name: the entity name
507 *
508 * Do an entity lookup in the DTD entity hash table and
509 * returns the corresponding entity, if found.
510 * Note: the first argument is the document node, not the DTD node.
511 *
512 * Returns A pointer to the entity structure or NULL if not found.
513 */
514 xmlEntityPtr
xmlGetDtdEntity(xmlDocPtr doc,const xmlChar * name)515 xmlGetDtdEntity(xmlDocPtr doc, const xmlChar *name) {
516 xmlEntitiesTablePtr table;
517
518 if (doc == NULL)
519 return(NULL);
520 if ((doc->extSubset != NULL) && (doc->extSubset->entities != NULL)) {
521 table = (xmlEntitiesTablePtr) doc->extSubset->entities;
522 return(xmlGetEntityFromTable(table, name));
523 }
524 return(NULL);
525 }
526
527 /**
528 * xmlGetDocEntity:
529 * @doc: the document referencing the entity
530 * @name: the entity name
531 *
532 * Do an entity lookup in the document entity hash table and
533 * returns the corresponding entity, otherwise a lookup is done
534 * in the predefined entities too.
535 *
536 * Returns A pointer to the entity structure or NULL if not found.
537 */
538 xmlEntityPtr
xmlGetDocEntity(const xmlDoc * doc,const xmlChar * name)539 xmlGetDocEntity(const xmlDoc *doc, const xmlChar *name) {
540 xmlEntityPtr cur;
541 xmlEntitiesTablePtr table;
542
543 if (doc != NULL) {
544 if ((doc->intSubset != NULL) && (doc->intSubset->entities != NULL)) {
545 table = (xmlEntitiesTablePtr) doc->intSubset->entities;
546 cur = xmlGetEntityFromTable(table, name);
547 if (cur != NULL)
548 return(cur);
549 }
550 if (doc->standalone != 1) {
551 if ((doc->extSubset != NULL) &&
552 (doc->extSubset->entities != NULL)) {
553 table = (xmlEntitiesTablePtr) doc->extSubset->entities;
554 cur = xmlGetEntityFromTable(table, name);
555 if (cur != NULL)
556 return(cur);
557 }
558 }
559 }
560 return(xmlGetPredefinedEntity(name));
561 }
562
563 /*
564 * Macro used to grow the current buffer.
565 */
566 #define growBufferReentrant() { \
567 xmlChar *tmp; \
568 size_t new_size = buffer_size * 2; \
569 if (new_size < buffer_size) goto mem_error; \
570 tmp = (xmlChar *) xmlRealloc(buffer, new_size); \
571 if (tmp == NULL) goto mem_error; \
572 buffer = tmp; \
573 buffer_size = new_size; \
574 }
575
576 /**
577 * xmlEncodeEntitiesInternal:
578 * @doc: the document containing the string
579 * @input: A string to convert to XML.
580 * @attr: are we handling an atrbute value
581 *
582 * Do a global encoding of a string, replacing the predefined entities
583 * and non ASCII values with their entities and CharRef counterparts.
584 * Contrary to xmlEncodeEntities, this routine is reentrant, and result
585 * must be deallocated.
586 *
587 * Returns A newly allocated string with the substitution done.
588 */
589 static xmlChar *
xmlEncodeEntitiesInternal(xmlDocPtr doc,const xmlChar * input,int attr)590 xmlEncodeEntitiesInternal(xmlDocPtr doc, const xmlChar *input, int attr) {
591 const xmlChar *cur = input;
592 xmlChar *buffer = NULL;
593 xmlChar *out = NULL;
594 size_t buffer_size = 0;
595 int html = 0;
596
597 if (input == NULL) return(NULL);
598 if (doc != NULL)
599 html = (doc->type == XML_HTML_DOCUMENT_NODE);
600
601 /*
602 * allocate an translation buffer.
603 */
604 buffer_size = 1000;
605 buffer = (xmlChar *) xmlMalloc(buffer_size * sizeof(xmlChar));
606 if (buffer == NULL) {
607 xmlEntitiesErrMemory("xmlEncodeEntities: malloc failed");
608 return(NULL);
609 }
610 out = buffer;
611
612 while (*cur != '\0') {
613 size_t indx = out - buffer;
614 if (indx + 100 > buffer_size) {
615
616 growBufferReentrant();
617 out = &buffer[indx];
618 }
619
620 /*
621 * By default one have to encode at least '<', '>', '"' and '&' !
622 */
623 if (*cur == '<') {
624 const xmlChar *end;
625
626 /*
627 * Special handling of server side include in HTML attributes
628 */
629 if (html && attr &&
630 (cur[1] == '!') && (cur[2] == '-') && (cur[3] == '-') &&
631 ((end = xmlStrstr(cur, BAD_CAST "-->")) != NULL)) {
632 while (cur != end) {
633 *out++ = *cur++;
634 indx = out - buffer;
635 if (indx + 100 > buffer_size) {
636 growBufferReentrant();
637 out = &buffer[indx];
638 }
639 }
640 *out++ = *cur++;
641 *out++ = *cur++;
642 *out++ = *cur++;
643 continue;
644 }
645 *out++ = '&';
646 *out++ = 'l';
647 *out++ = 't';
648 *out++ = ';';
649 } else if (*cur == '>') {
650 *out++ = '&';
651 *out++ = 'g';
652 *out++ = 't';
653 *out++ = ';';
654 } else if (*cur == '&') {
655 /*
656 * Special handling of &{...} construct from HTML 4, see
657 * http://www.w3.org/TR/html401/appendix/notes.html#h-B.7.1
658 */
659 if (html && attr && (cur[1] == '{') &&
660 (strchr((const char *) cur, '}'))) {
661 while (*cur != '}') {
662 *out++ = *cur++;
663 indx = out - buffer;
664 if (indx + 100 > buffer_size) {
665 growBufferReentrant();
666 out = &buffer[indx];
667 }
668 }
669 *out++ = *cur++;
670 continue;
671 }
672 *out++ = '&';
673 *out++ = 'a';
674 *out++ = 'm';
675 *out++ = 'p';
676 *out++ = ';';
677 } else if (((*cur >= 0x20) && (*cur < 0x80)) ||
678 (*cur == '\n') || (*cur == '\t') || ((html) && (*cur == '\r'))) {
679 /*
680 * default case, just copy !
681 */
682 *out++ = *cur;
683 } else if (*cur >= 0x80) {
684 if (((doc != NULL) && (doc->encoding != NULL)) || (html)) {
685 /*
686 * Bjørn Reese <br@sseusa.com> provided the patch
687 xmlChar xc;
688 xc = (*cur & 0x3F) << 6;
689 if (cur[1] != 0) {
690 xc += *(++cur) & 0x3F;
691 *out++ = xc;
692 } else
693 */
694 *out++ = *cur;
695 } else {
696 /*
697 * We assume we have UTF-8 input.
698 */
699 char buf[11], *ptr;
700 int val = 0, l = 1;
701
702 if (*cur < 0xC0) {
703 xmlEntitiesErr(XML_CHECK_NOT_UTF8,
704 "xmlEncodeEntities: input not UTF-8");
705 if (doc != NULL)
706 doc->encoding = xmlStrdup(BAD_CAST "ISO-8859-1");
707 snprintf(buf, sizeof(buf), "&#%d;", *cur);
708 buf[sizeof(buf) - 1] = 0;
709 ptr = buf;
710 while (*ptr != 0) *out++ = *ptr++;
711 cur++;
712 continue;
713 } else if (*cur < 0xE0) {
714 val = (cur[0]) & 0x1F;
715 val <<= 6;
716 val |= (cur[1]) & 0x3F;
717 l = 2;
718 } else if (*cur < 0xF0) {
719 val = (cur[0]) & 0x0F;
720 val <<= 6;
721 val |= (cur[1]) & 0x3F;
722 val <<= 6;
723 val |= (cur[2]) & 0x3F;
724 l = 3;
725 } else if (*cur < 0xF8) {
726 val = (cur[0]) & 0x07;
727 val <<= 6;
728 val |= (cur[1]) & 0x3F;
729 val <<= 6;
730 val |= (cur[2]) & 0x3F;
731 val <<= 6;
732 val |= (cur[3]) & 0x3F;
733 l = 4;
734 }
735 if ((l == 1) || (!IS_CHAR(val))) {
736 xmlEntitiesErr(XML_ERR_INVALID_CHAR,
737 "xmlEncodeEntities: char out of range\n");
738 if (doc != NULL)
739 doc->encoding = xmlStrdup(BAD_CAST "ISO-8859-1");
740 snprintf(buf, sizeof(buf), "&#%d;", *cur);
741 buf[sizeof(buf) - 1] = 0;
742 ptr = buf;
743 while (*ptr != 0) *out++ = *ptr++;
744 cur++;
745 continue;
746 }
747 /*
748 * We could do multiple things here. Just save as a char ref
749 */
750 snprintf(buf, sizeof(buf), "&#x%X;", val);
751 buf[sizeof(buf) - 1] = 0;
752 ptr = buf;
753 while (*ptr != 0) *out++ = *ptr++;
754 cur += l;
755 continue;
756 }
757 } else if (IS_BYTE_CHAR(*cur)) {
758 char buf[11], *ptr;
759
760 snprintf(buf, sizeof(buf), "&#%d;", *cur);
761 buf[sizeof(buf) - 1] = 0;
762 ptr = buf;
763 while (*ptr != 0) *out++ = *ptr++;
764 }
765 cur++;
766 }
767 *out = 0;
768 return(buffer);
769
770 mem_error:
771 xmlEntitiesErrMemory("xmlEncodeEntities: realloc failed");
772 xmlFree(buffer);
773 return(NULL);
774 }
775
776 /**
777 * xmlEncodeAttributeEntities:
778 * @doc: the document containing the string
779 * @input: A string to convert to XML.
780 *
781 * Do a global encoding of a string, replacing the predefined entities
782 * and non ASCII values with their entities and CharRef counterparts for
783 * attribute values.
784 *
785 * Returns A newly allocated string with the substitution done.
786 */
787 xmlChar *
xmlEncodeAttributeEntities(xmlDocPtr doc,const xmlChar * input)788 xmlEncodeAttributeEntities(xmlDocPtr doc, const xmlChar *input) {
789 return xmlEncodeEntitiesInternal(doc, input, 1);
790 }
791
792 /**
793 * xmlEncodeEntitiesReentrant:
794 * @doc: the document containing the string
795 * @input: A string to convert to XML.
796 *
797 * Do a global encoding of a string, replacing the predefined entities
798 * and non ASCII values with their entities and CharRef counterparts.
799 * Contrary to xmlEncodeEntities, this routine is reentrant, and result
800 * must be deallocated.
801 *
802 * Returns A newly allocated string with the substitution done.
803 */
804 xmlChar *
xmlEncodeEntitiesReentrant(xmlDocPtr doc,const xmlChar * input)805 xmlEncodeEntitiesReentrant(xmlDocPtr doc, const xmlChar *input) {
806 return xmlEncodeEntitiesInternal(doc, input, 0);
807 }
808
809 /**
810 * xmlEncodeSpecialChars:
811 * @doc: the document containing the string
812 * @input: A string to convert to XML.
813 *
814 * Do a global encoding of a string, replacing the predefined entities
815 * this routine is reentrant, and result must be deallocated.
816 *
817 * Returns A newly allocated string with the substitution done.
818 */
819 xmlChar *
xmlEncodeSpecialChars(const xmlDoc * doc ATTRIBUTE_UNUSED,const xmlChar * input)820 xmlEncodeSpecialChars(const xmlDoc *doc ATTRIBUTE_UNUSED, const xmlChar *input) {
821 const xmlChar *cur = input;
822 xmlChar *buffer = NULL;
823 xmlChar *out = NULL;
824 size_t buffer_size = 0;
825 if (input == NULL) return(NULL);
826
827 /*
828 * allocate an translation buffer.
829 */
830 buffer_size = 1000;
831 buffer = (xmlChar *) xmlMalloc(buffer_size * sizeof(xmlChar));
832 if (buffer == NULL) {
833 xmlEntitiesErrMemory("xmlEncodeSpecialChars: malloc failed");
834 return(NULL);
835 }
836 out = buffer;
837
838 while (*cur != '\0') {
839 size_t indx = out - buffer;
840 if (indx + 10 > buffer_size) {
841
842 growBufferReentrant();
843 out = &buffer[indx];
844 }
845
846 /*
847 * By default one have to encode at least '<', '>', '"' and '&' !
848 */
849 if (*cur == '<') {
850 *out++ = '&';
851 *out++ = 'l';
852 *out++ = 't';
853 *out++ = ';';
854 } else if (*cur == '>') {
855 *out++ = '&';
856 *out++ = 'g';
857 *out++ = 't';
858 *out++ = ';';
859 } else if (*cur == '&') {
860 *out++ = '&';
861 *out++ = 'a';
862 *out++ = 'm';
863 *out++ = 'p';
864 *out++ = ';';
865 } else if (*cur == '"') {
866 *out++ = '&';
867 *out++ = 'q';
868 *out++ = 'u';
869 *out++ = 'o';
870 *out++ = 't';
871 *out++ = ';';
872 } else if (*cur == '\r') {
873 *out++ = '&';
874 *out++ = '#';
875 *out++ = '1';
876 *out++ = '3';
877 *out++ = ';';
878 } else {
879 /*
880 * Works because on UTF-8, all extended sequences cannot
881 * result in bytes in the ASCII range.
882 */
883 *out++ = *cur;
884 }
885 cur++;
886 }
887 *out = 0;
888 return(buffer);
889
890 mem_error:
891 xmlEntitiesErrMemory("xmlEncodeSpecialChars: realloc failed");
892 xmlFree(buffer);
893 return(NULL);
894 }
895
896 /**
897 * xmlCreateEntitiesTable:
898 *
899 * create and initialize an empty entities hash table.
900 * This really doesn't make sense and should be deprecated
901 *
902 * Returns the xmlEntitiesTablePtr just created or NULL in case of error.
903 */
904 xmlEntitiesTablePtr
xmlCreateEntitiesTable(void)905 xmlCreateEntitiesTable(void) {
906 return((xmlEntitiesTablePtr) xmlHashCreate(0));
907 }
908
909 /**
910 * xmlFreeEntityWrapper:
911 * @entity: An entity
912 * @name: its name
913 *
914 * Deallocate the memory used by an entities in the hash table.
915 */
916 static void
xmlFreeEntityWrapper(void * entity,const xmlChar * name ATTRIBUTE_UNUSED)917 xmlFreeEntityWrapper(void *entity, const xmlChar *name ATTRIBUTE_UNUSED) {
918 if (entity != NULL)
919 xmlFreeEntity((xmlEntityPtr) entity);
920 }
921
922 /**
923 * xmlFreeEntitiesTable:
924 * @table: An entity table
925 *
926 * Deallocate the memory used by an entities hash table.
927 */
928 void
xmlFreeEntitiesTable(xmlEntitiesTablePtr table)929 xmlFreeEntitiesTable(xmlEntitiesTablePtr table) {
930 xmlHashFree(table, xmlFreeEntityWrapper);
931 }
932
933 #ifdef LIBXML_TREE_ENABLED
934 /**
935 * xmlCopyEntity:
936 * @ent: An entity
937 *
938 * Build a copy of an entity
939 *
940 * Returns the new xmlEntitiesPtr or NULL in case of error.
941 */
942 static void *
xmlCopyEntity(void * payload,const xmlChar * name ATTRIBUTE_UNUSED)943 xmlCopyEntity(void *payload, const xmlChar *name ATTRIBUTE_UNUSED) {
944 xmlEntityPtr ent = (xmlEntityPtr) payload;
945 xmlEntityPtr cur;
946
947 cur = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
948 if (cur == NULL) {
949 xmlEntitiesErrMemory("xmlCopyEntity:: malloc failed");
950 return(NULL);
951 }
952 memset(cur, 0, sizeof(xmlEntity));
953 cur->type = XML_ENTITY_DECL;
954
955 cur->etype = ent->etype;
956 if (ent->name != NULL)
957 cur->name = xmlStrdup(ent->name);
958 if (ent->ExternalID != NULL)
959 cur->ExternalID = xmlStrdup(ent->ExternalID);
960 if (ent->SystemID != NULL)
961 cur->SystemID = xmlStrdup(ent->SystemID);
962 if (ent->content != NULL)
963 cur->content = xmlStrdup(ent->content);
964 if (ent->orig != NULL)
965 cur->orig = xmlStrdup(ent->orig);
966 if (ent->URI != NULL)
967 cur->URI = xmlStrdup(ent->URI);
968 return(cur);
969 }
970
971 /**
972 * xmlCopyEntitiesTable:
973 * @table: An entity table
974 *
975 * Build a copy of an entity table.
976 *
977 * Returns the new xmlEntitiesTablePtr or NULL in case of error.
978 */
979 xmlEntitiesTablePtr
xmlCopyEntitiesTable(xmlEntitiesTablePtr table)980 xmlCopyEntitiesTable(xmlEntitiesTablePtr table) {
981 return(xmlHashCopy(table, xmlCopyEntity));
982 }
983 #endif /* LIBXML_TREE_ENABLED */
984
985 #ifdef LIBXML_OUTPUT_ENABLED
986
987 /**
988 * xmlDumpEntityContent:
989 * @buf: An XML buffer.
990 * @content: The entity content.
991 *
992 * This will dump the quoted string value, taking care of the special
993 * treatment required by %
994 */
995 static void
xmlDumpEntityContent(xmlBufferPtr buf,const xmlChar * content)996 xmlDumpEntityContent(xmlBufferPtr buf, const xmlChar *content) {
997 if (buf->alloc == XML_BUFFER_ALLOC_IMMUTABLE) return;
998 if (xmlStrchr(content, '%')) {
999 const xmlChar * base, *cur;
1000
1001 xmlBufferCCat(buf, "\"");
1002 base = cur = content;
1003 while (*cur != 0) {
1004 if (*cur == '"') {
1005 if (base != cur)
1006 xmlBufferAdd(buf, base, cur - base);
1007 xmlBufferAdd(buf, BAD_CAST """, 6);
1008 cur++;
1009 base = cur;
1010 } else if (*cur == '%') {
1011 if (base != cur)
1012 xmlBufferAdd(buf, base, cur - base);
1013 xmlBufferAdd(buf, BAD_CAST "%", 6);
1014 cur++;
1015 base = cur;
1016 } else {
1017 cur++;
1018 }
1019 }
1020 if (base != cur)
1021 xmlBufferAdd(buf, base, cur - base);
1022 xmlBufferCCat(buf, "\"");
1023 } else {
1024 xmlBufferWriteQuotedString(buf, content);
1025 }
1026 }
1027
1028 /**
1029 * xmlDumpEntityDecl:
1030 * @buf: An XML buffer.
1031 * @ent: An entity table
1032 *
1033 * This will dump the content of the entity table as an XML DTD definition
1034 */
1035 void
xmlDumpEntityDecl(xmlBufferPtr buf,xmlEntityPtr ent)1036 xmlDumpEntityDecl(xmlBufferPtr buf, xmlEntityPtr ent) {
1037 if ((buf == NULL) || (ent == NULL)) return;
1038 switch (ent->etype) {
1039 case XML_INTERNAL_GENERAL_ENTITY:
1040 xmlBufferWriteChar(buf, "<!ENTITY ");
1041 xmlBufferWriteCHAR(buf, ent->name);
1042 xmlBufferWriteChar(buf, " ");
1043 if (ent->orig != NULL)
1044 xmlBufferWriteQuotedString(buf, ent->orig);
1045 else
1046 xmlDumpEntityContent(buf, ent->content);
1047 xmlBufferWriteChar(buf, ">\n");
1048 break;
1049 case XML_EXTERNAL_GENERAL_PARSED_ENTITY:
1050 xmlBufferWriteChar(buf, "<!ENTITY ");
1051 xmlBufferWriteCHAR(buf, ent->name);
1052 if (ent->ExternalID != NULL) {
1053 xmlBufferWriteChar(buf, " PUBLIC ");
1054 xmlBufferWriteQuotedString(buf, ent->ExternalID);
1055 xmlBufferWriteChar(buf, " ");
1056 xmlBufferWriteQuotedString(buf, ent->SystemID);
1057 } else {
1058 xmlBufferWriteChar(buf, " SYSTEM ");
1059 xmlBufferWriteQuotedString(buf, ent->SystemID);
1060 }
1061 xmlBufferWriteChar(buf, ">\n");
1062 break;
1063 case XML_EXTERNAL_GENERAL_UNPARSED_ENTITY:
1064 xmlBufferWriteChar(buf, "<!ENTITY ");
1065 xmlBufferWriteCHAR(buf, ent->name);
1066 if (ent->ExternalID != NULL) {
1067 xmlBufferWriteChar(buf, " PUBLIC ");
1068 xmlBufferWriteQuotedString(buf, ent->ExternalID);
1069 xmlBufferWriteChar(buf, " ");
1070 xmlBufferWriteQuotedString(buf, ent->SystemID);
1071 } else {
1072 xmlBufferWriteChar(buf, " SYSTEM ");
1073 xmlBufferWriteQuotedString(buf, ent->SystemID);
1074 }
1075 if (ent->content != NULL) { /* Should be true ! */
1076 xmlBufferWriteChar(buf, " NDATA ");
1077 if (ent->orig != NULL)
1078 xmlBufferWriteCHAR(buf, ent->orig);
1079 else
1080 xmlBufferWriteCHAR(buf, ent->content);
1081 }
1082 xmlBufferWriteChar(buf, ">\n");
1083 break;
1084 case XML_INTERNAL_PARAMETER_ENTITY:
1085 xmlBufferWriteChar(buf, "<!ENTITY % ");
1086 xmlBufferWriteCHAR(buf, ent->name);
1087 xmlBufferWriteChar(buf, " ");
1088 if (ent->orig == NULL)
1089 xmlDumpEntityContent(buf, ent->content);
1090 else
1091 xmlBufferWriteQuotedString(buf, ent->orig);
1092 xmlBufferWriteChar(buf, ">\n");
1093 break;
1094 case XML_EXTERNAL_PARAMETER_ENTITY:
1095 xmlBufferWriteChar(buf, "<!ENTITY % ");
1096 xmlBufferWriteCHAR(buf, ent->name);
1097 if (ent->ExternalID != NULL) {
1098 xmlBufferWriteChar(buf, " PUBLIC ");
1099 xmlBufferWriteQuotedString(buf, ent->ExternalID);
1100 xmlBufferWriteChar(buf, " ");
1101 xmlBufferWriteQuotedString(buf, ent->SystemID);
1102 } else {
1103 xmlBufferWriteChar(buf, " SYSTEM ");
1104 xmlBufferWriteQuotedString(buf, ent->SystemID);
1105 }
1106 xmlBufferWriteChar(buf, ">\n");
1107 break;
1108 default:
1109 xmlEntitiesErr(XML_DTD_UNKNOWN_ENTITY,
1110 "xmlDumpEntitiesDecl: internal: unknown type entity type");
1111 }
1112 }
1113
1114 /**
1115 * xmlDumpEntityDeclScan:
1116 * @ent: An entity table
1117 * @buf: An XML buffer.
1118 *
1119 * When using the hash table scan function, arguments need to be reversed
1120 */
1121 static void
xmlDumpEntityDeclScan(void * ent,void * buf,const xmlChar * name ATTRIBUTE_UNUSED)1122 xmlDumpEntityDeclScan(void *ent, void *buf,
1123 const xmlChar *name ATTRIBUTE_UNUSED) {
1124 xmlDumpEntityDecl((xmlBufferPtr) buf, (xmlEntityPtr) ent);
1125 }
1126
1127 /**
1128 * xmlDumpEntitiesTable:
1129 * @buf: An XML buffer.
1130 * @table: An entity table
1131 *
1132 * This will dump the content of the entity table as an XML DTD definition
1133 */
1134 void
xmlDumpEntitiesTable(xmlBufferPtr buf,xmlEntitiesTablePtr table)1135 xmlDumpEntitiesTable(xmlBufferPtr buf, xmlEntitiesTablePtr table) {
1136 xmlHashScan(table, xmlDumpEntityDeclScan, buf);
1137 }
1138 #endif /* LIBXML_OUTPUT_ENABLED */
1139 #define bottom_entities
1140 #include "elfgcchack.h"
1141