blob: 919c74e9f97fe8129aacc514217c94f89dd86109 [file] [log] [blame]
Victor Stinner759e30e2017-09-05 01:58:08 +02001/* This file is included!
2 __ __ _
3 ___\ \/ /_ __ __ _| |_
4 / _ \\ /| '_ \ / _` | __|
5 | __// \| |_) | (_| | |_
6 \___/_/\_\ .__/ \__,_|\__|
7 |_| XML parser
8
9 Copyright (c) 1997-2000 Thai Open Source Software Center Ltd
10 Copyright (c) 2000-2017 Expat development team
11 Licensed under the MIT license:
12
13 Permission is hereby granted, free of charge, to any person obtaining
14 a copy of this software and associated documentation files (the
15 "Software"), to deal in the Software without restriction, including
16 without limitation the rights to use, copy, modify, merge, publish,
17 distribute, sublicense, and/or sell copies of the Software, and to permit
18 persons to whom the Software is furnished to do so, subject to the
19 following conditions:
20
21 The above copyright notice and this permission notice shall be included
22 in all copies or substantial portions of the Software.
23
24 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
25 EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
26 MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN
27 NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM,
28 DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
29 OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
30 USE OR OTHER DEALINGS IN THE SOFTWARE.
Gregory P. Smith7c6309c2012-07-14 14:12:35 -070031*/
32
Gregory P. Smith7c6309c2012-07-14 14:12:35 -070033#ifdef XML_TOK_NS_C
34
Martin v. Löwisfc03a942003-01-25 22:41:29 +000035const ENCODING *
Benjamin Peterson52b94082019-09-25 21:33:58 -070036NS(XmlGetUtf8InternalEncoding)(void) {
Martin v. Löwis1dbb1ca2002-02-11 23:13:04 +000037 return &ns(internal_utf8_encoding).enc;
38}
39
Martin v. Löwisfc03a942003-01-25 22:41:29 +000040const ENCODING *
Benjamin Peterson52b94082019-09-25 21:33:58 -070041NS(XmlGetUtf16InternalEncoding)(void) {
42# if BYTEORDER == 1234
Martin v. Löwis1dbb1ca2002-02-11 23:13:04 +000043 return &ns(internal_little2_encoding).enc;
Benjamin Peterson52b94082019-09-25 21:33:58 -070044# elif BYTEORDER == 4321
Martin v. Löwis1dbb1ca2002-02-11 23:13:04 +000045 return &ns(internal_big2_encoding).enc;
Benjamin Peterson52b94082019-09-25 21:33:58 -070046# else
Martin v. Löwis1dbb1ca2002-02-11 23:13:04 +000047 const short n = 1;
Benjamin Peterson52b94082019-09-25 21:33:58 -070048 return (*(const char *)&n ? &ns(internal_little2_encoding).enc
49 : &ns(internal_big2_encoding).enc);
50# endif
Martin v. Löwis1dbb1ca2002-02-11 23:13:04 +000051}
52
Benjamin Peterson52b94082019-09-25 21:33:58 -070053static const ENCODING *const NS(encodings)[] = {
54 &ns(latin1_encoding).enc, &ns(ascii_encoding).enc,
55 &ns(utf8_encoding).enc, &ns(big2_encoding).enc,
56 &ns(big2_encoding).enc, &ns(little2_encoding).enc,
57 &ns(utf8_encoding).enc /* NO_ENC */
Martin v. Löwis1dbb1ca2002-02-11 23:13:04 +000058};
59
Martin v. Löwisfc03a942003-01-25 22:41:29 +000060static int PTRCALL
61NS(initScanProlog)(const ENCODING *enc, const char *ptr, const char *end,
Benjamin Peterson52b94082019-09-25 21:33:58 -070062 const char **nextTokPtr) {
63 return initScan(NS(encodings), (const INIT_ENCODING *)enc, XML_PROLOG_STATE,
64 ptr, end, nextTokPtr);
Martin v. Löwis1dbb1ca2002-02-11 23:13:04 +000065}
66
Martin v. Löwisfc03a942003-01-25 22:41:29 +000067static int PTRCALL
68NS(initScanContent)(const ENCODING *enc, const char *ptr, const char *end,
Benjamin Peterson52b94082019-09-25 21:33:58 -070069 const char **nextTokPtr) {
70 return initScan(NS(encodings), (const INIT_ENCODING *)enc, XML_CONTENT_STATE,
71 ptr, end, nextTokPtr);
Martin v. Löwis1dbb1ca2002-02-11 23:13:04 +000072}
73
Martin v. Löwisfc03a942003-01-25 22:41:29 +000074int
75NS(XmlInitEncoding)(INIT_ENCODING *p, const ENCODING **encPtr,
Benjamin Peterson52b94082019-09-25 21:33:58 -070076 const char *name) {
Martin v. Löwis1dbb1ca2002-02-11 23:13:04 +000077 int i = getEncodingIndex(name);
78 if (i == UNKNOWN_ENC)
79 return 0;
80 SET_INIT_ENC_INDEX(p, i);
81 p->initEnc.scanners[XML_PROLOG_STATE] = NS(initScanProlog);
82 p->initEnc.scanners[XML_CONTENT_STATE] = NS(initScanContent);
83 p->initEnc.updatePosition = initUpdatePosition;
84 p->encPtr = encPtr;
85 *encPtr = &(p->initEnc);
86 return 1;
87}
88
Martin v. Löwisfc03a942003-01-25 22:41:29 +000089static const ENCODING *
Benjamin Peterson52b94082019-09-25 21:33:58 -070090NS(findEncoding)(const ENCODING *enc, const char *ptr, const char *end) {
91# define ENCODING_MAX 128
Martin v. Löwis1dbb1ca2002-02-11 23:13:04 +000092 char buf[ENCODING_MAX];
93 char *p = buf;
94 int i;
95 XmlUtf8Convert(enc, &ptr, end, &p, p + ENCODING_MAX - 1);
96 if (ptr != end)
97 return 0;
98 *p = 0;
99 if (streqci(buf, KW_UTF_16) && enc->minBytesPerChar == 2)
100 return enc;
101 i = getEncodingIndex(buf);
102 if (i == UNKNOWN_ENC)
103 return 0;
104 return NS(encodings)[i];
105}
106
Martin v. Löwisfc03a942003-01-25 22:41:29 +0000107int
Benjamin Peterson52b94082019-09-25 21:33:58 -0700108NS(XmlParseXmlDecl)(int isGeneralTextEntity, const ENCODING *enc,
109 const char *ptr, const char *end, const char **badPtr,
110 const char **versionPtr, const char **versionEndPtr,
111 const char **encodingName, const ENCODING **encoding,
112 int *standalone) {
113 return doParseXmlDecl(NS(findEncoding), isGeneralTextEntity, enc, ptr, end,
114 badPtr, versionPtr, versionEndPtr, encodingName,
115 encoding, standalone);
Martin v. Löwis1dbb1ca2002-02-11 23:13:04 +0000116}
Gregory P. Smith7c6309c2012-07-14 14:12:35 -0700117
118#endif /* XML_TOK_NS_C */