1 /* This file is included!
2 __ __ _
3 ___\ \/ /_ __ __ _| |_
4 / _ \\ /| '_ \ / _` | __|
5 | __// \| |_) | (_| | |_
6 \___/_/\_\ .__/ \__,_|\__|
7 |_| XML parser
8
9 Copyright (c) 1997-2000 Thai Open Source Software Center Ltd
10 Copyright (c) 2000 Clark Cooper <coopercc@users.sourceforge.net>
11 Copyright (c) 2002 Greg Stein <gstein@users.sourceforge.net>
12 Copyright (c) 2002 Fred L. Drake, Jr. <fdrake@users.sourceforge.net>
13 Copyright (c) 2002-2006 Karl Waclawek <karl@waclawek.net>
14 Copyright (c) 2017 Sebastian Pipping <sebastian@pipping.org>
15 Licensed under the MIT license:
16
17 Permission is hereby granted, free of charge, to any person obtaining
18 a copy of this software and associated documentation files (the
19 "Software"), to deal in the Software without restriction, including
20 without limitation the rights to use, copy, modify, merge, publish,
21 distribute, sublicense, and/or sell copies of the Software, and to permit
22 persons to whom the Software is furnished to do so, subject to the
23 following conditions:
24
25 The above copyright notice and this permission notice shall be included
26 in all copies or substantial portions of the Software.
27
28 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
29 EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
30 MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN
31 NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM,
32 DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
33 OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
34 USE OR OTHER DEALINGS IN THE SOFTWARE.
35 */
36
37 #ifdef XML_TOK_NS_C
38
39 const ENCODING *
NS(XmlGetUtf8InternalEncoding)40 NS(XmlGetUtf8InternalEncoding)(void) {
41 return &ns(internal_utf8_encoding).enc;
42 }
43
44 const ENCODING *
NS(XmlGetUtf16InternalEncoding)45 NS(XmlGetUtf16InternalEncoding)(void) {
46 # if BYTEORDER == 1234
47 return &ns(internal_little2_encoding).enc;
48 # elif BYTEORDER == 4321
49 return &ns(internal_big2_encoding).enc;
50 # else
51 const short n = 1;
52 return (*(const char *)&n ? &ns(internal_little2_encoding).enc
53 : &ns(internal_big2_encoding).enc);
54 # endif
55 }
56
57 static const ENCODING *const NS(encodings)[] = {
58 &ns(latin1_encoding).enc, &ns(ascii_encoding).enc,
59 &ns(utf8_encoding).enc, &ns(big2_encoding).enc,
60 &ns(big2_encoding).enc, &ns(little2_encoding).enc,
61 &ns(utf8_encoding).enc /* NO_ENC */
62 };
63
64 static int PTRCALL
NS(initScanProlog)65 NS(initScanProlog)(const ENCODING *enc, const char *ptr, const char *end,
66 const char **nextTokPtr) {
67 return initScan(NS(encodings), (const INIT_ENCODING *)enc, XML_PROLOG_STATE,
68 ptr, end, nextTokPtr);
69 }
70
71 static int PTRCALL
NS(initScanContent)72 NS(initScanContent)(const ENCODING *enc, const char *ptr, const char *end,
73 const char **nextTokPtr) {
74 return initScan(NS(encodings), (const INIT_ENCODING *)enc, XML_CONTENT_STATE,
75 ptr, end, nextTokPtr);
76 }
77
78 int
NS(XmlInitEncoding)79 NS(XmlInitEncoding)(INIT_ENCODING *p, const ENCODING **encPtr,
80 const char *name) {
81 int i = getEncodingIndex(name);
82 if (i == UNKNOWN_ENC)
83 return 0;
84 SET_INIT_ENC_INDEX(p, i);
85 p->initEnc.scanners[XML_PROLOG_STATE] = NS(initScanProlog);
86 p->initEnc.scanners[XML_CONTENT_STATE] = NS(initScanContent);
87 p->initEnc.updatePosition = initUpdatePosition;
88 p->encPtr = encPtr;
89 *encPtr = &(p->initEnc);
90 return 1;
91 }
92
93 static const ENCODING *
NS(findEncoding)94 NS(findEncoding)(const ENCODING *enc, const char *ptr, const char *end) {
95 # define ENCODING_MAX 128
96 char buf[ENCODING_MAX];
97 char *p = buf;
98 int i;
99 XmlUtf8Convert(enc, &ptr, end, &p, p + ENCODING_MAX - 1);
100 if (ptr != end)
101 return 0;
102 *p = 0;
103 if (streqci(buf, KW_UTF_16) && enc->minBytesPerChar == 2)
104 return enc;
105 i = getEncodingIndex(buf);
106 if (i == UNKNOWN_ENC)
107 return 0;
108 return NS(encodings)[i];
109 }
110
111 int
NS(XmlParseXmlDecl)112 NS(XmlParseXmlDecl)(int isGeneralTextEntity, const ENCODING *enc,
113 const char *ptr, const char *end, const char **badPtr,
114 const char **versionPtr, const char **versionEndPtr,
115 const char **encodingName, const ENCODING **encoding,
116 int *standalone) {
117 return doParseXmlDecl(NS(findEncoding), isGeneralTextEntity, enc, ptr, end,
118 badPtr, versionPtr, versionEndPtr, encodingName,
119 encoding, standalone);
120 }
121
122 #endif /* XML_TOK_NS_C */
123