1 | /* This file is included! |
2 | __ __ _ |
3 | ___\ \/ /_ __ __ _| |_ |
4 | / _ \\ /| '_ \ / _` | __| |
5 | | __// \| |_) | (_| | |_ |
6 | \___/_/\_\ .__/ \__,_|\__| |
7 | |_| XML parser |
8 | |
9 | Copyright (c) 1997-2000 Thai Open Source Software Center Ltd |
10 | Copyright (c) 2000 Clark Cooper <[email protected]> |
11 | Copyright (c) 2002 Greg Stein <[email protected]> |
12 | Copyright (c) 2002 Fred L. Drake, Jr. <[email protected]> |
13 | Copyright (c) 2002-2006 Karl Waclawek <[email protected]> |
14 | Copyright (c) 2017-2021 Sebastian Pipping <[email protected]> |
15 | Licensed under the MIT license: |
16 | |
17 | Permission is hereby granted, free of charge, to any person obtaining |
18 | a copy of this software and associated documentation files (the |
19 | "Software"), to deal in the Software without restriction, including |
20 | without limitation the rights to use, copy, modify, merge, publish, |
21 | distribute, sublicense, and/or sell copies of the Software, and to permit |
22 | persons to whom the Software is furnished to do so, subject to the |
23 | following conditions: |
24 | |
25 | The above copyright notice and this permission notice shall be included |
26 | in all copies or substantial portions of the Software. |
27 | |
28 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, |
29 | EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF |
30 | MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN |
31 | NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, |
32 | DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR |
33 | OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE |
34 | USE OR OTHER DEALINGS IN THE SOFTWARE. |
35 | */ |
36 | |
37 | #ifdef XML_TOK_NS_C |
38 | |
39 | const ENCODING * |
40 | NS(XmlGetUtf8InternalEncoding)(void) { |
41 | return &ns(internal_utf8_encoding).enc; |
42 | } |
43 | |
44 | const ENCODING * |
45 | NS(XmlGetUtf16InternalEncoding)(void) { |
46 | # if BYTEORDER == 1234 |
47 | return &ns(internal_little2_encoding).enc; |
48 | # elif BYTEORDER == 4321 |
49 | return &ns(internal_big2_encoding).enc; |
50 | # else |
51 | const short n = 1; |
52 | return (*(const char *)&n ? &ns(internal_little2_encoding).enc |
53 | : &ns(internal_big2_encoding).enc); |
54 | # endif |
55 | } |
56 | |
57 | static const ENCODING *const NS(encodings)[] = { |
58 | &ns(latin1_encoding).enc, &ns(ascii_encoding).enc, |
59 | &ns(utf8_encoding).enc, &ns(big2_encoding).enc, |
60 | &ns(big2_encoding).enc, &ns(little2_encoding).enc, |
61 | &ns(utf8_encoding).enc /* NO_ENC */ |
62 | }; |
63 | |
64 | static int PTRCALL |
65 | NS(initScanProlog)(const ENCODING *enc, const char *ptr, const char *end, |
66 | const char **nextTokPtr) { |
67 | return initScan(NS(encodings), (const INIT_ENCODING *)enc, XML_PROLOG_STATE, |
68 | ptr, end, nextTokPtr); |
69 | } |
70 | |
71 | static int PTRCALL |
72 | NS(initScanContent)(const ENCODING *enc, const char *ptr, const char *end, |
73 | const char **nextTokPtr) { |
74 | return initScan(NS(encodings), (const INIT_ENCODING *)enc, XML_CONTENT_STATE, |
75 | ptr, end, nextTokPtr); |
76 | } |
77 | |
78 | int |
79 | NS(XmlInitEncoding)(INIT_ENCODING *p, const ENCODING **encPtr, |
80 | const char *name) { |
81 | int i = getEncodingIndex(name); |
82 | if (i == UNKNOWN_ENC) |
83 | return 0; |
84 | SET_INIT_ENC_INDEX(p, i); |
85 | p->initEnc.scanners[XML_PROLOG_STATE] = NS(initScanProlog); |
86 | p->initEnc.scanners[XML_CONTENT_STATE] = NS(initScanContent); |
87 | p->initEnc.updatePosition = initUpdatePosition; |
88 | p->encPtr = encPtr; |
89 | *encPtr = &(p->initEnc); |
90 | return 1; |
91 | } |
92 | |
93 | static const ENCODING * |
94 | NS(findEncoding)(const ENCODING *enc, const char *ptr, const char *end) { |
95 | # define ENCODING_MAX 128 |
96 | char buf[ENCODING_MAX] = "" ; |
97 | char *p = buf; |
98 | int i; |
99 | XmlUtf8Convert(enc, &ptr, end, &p, p + ENCODING_MAX - 1); |
100 | if (ptr != end) |
101 | return 0; |
102 | *p = 0; |
103 | if (streqci(buf, KW_UTF_16) && enc->minBytesPerChar == 2) |
104 | return enc; |
105 | i = getEncodingIndex(buf); |
106 | if (i == UNKNOWN_ENC) |
107 | return 0; |
108 | return NS(encodings)[i]; |
109 | } |
110 | |
111 | int |
112 | NS(XmlParseXmlDecl)(int isGeneralTextEntity, const ENCODING *enc, |
113 | const char *ptr, const char *end, const char **badPtr, |
114 | const char **versionPtr, const char **versionEndPtr, |
115 | const char **encodingName, const ENCODING **encoding, |
116 | int *standalone) { |
117 | return doParseXmlDecl(NS(findEncoding), isGeneralTextEntity, enc, ptr, end, |
118 | badPtr, versionPtr, versionEndPtr, encodingName, |
119 | encoding, standalone); |
120 | } |
121 | |
122 | #endif /* XML_TOK_NS_C */ |
123 | |