blob: 9ca555bf5310de2000440e6fa49a90aa650d111a [file] [log] [blame]
/* Copyright (c) 2002,2003, Stefan Haustein, Oberhausen, Rhld., Germany
*
* Permission is hereby granted, free of charge, to any person obtaining a copy
* of this software and associated documentation files (the "Software"), to deal
* in the Software without restriction, including without limitation the rights
* to use, copy, modify, merge, publish, distribute, sublicense, and/or
* sell copies of the Software, and to permit persons to whom the Software is
* furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
* IN THE SOFTWARE. */
// Contributors: Paul Hackenberger (unterminated entity handling in relaxed mode)
package org.kxml2.io;
import java.io.IOException;
import java.io.InputStream;
import java.io.InputStreamReader;
import java.io.Reader;
import java.util.HashMap;
import java.util.Map;
import org.xmlpull.v1.XmlPullParser;
import org.xmlpull.v1.XmlPullParserException;
/**
* A pull based XML parser.
*/
public class KXmlParser implements XmlPullParser {
// Literal delimiters matched against the input buffer by read(char[]) and readUntil().
private static final char[] START_COMMENT = { '<', '!', '-', '-' };
private static final char[] END_COMMENT = { '-', '-', '>' };
private static final char[] START_CDATA = { '<', '!', '[', 'C', 'D', 'A', 'T', 'A', '[' };
private static final char[] END_CDATA = { ']', ']', '>' };
private static final char[] START_PROCESSING_INSTRUCTION = { '<', '?' };
private static final char[] END_PROCESSING_INSTRUCTION = { '?', '>' };
private static final char[] START_DOCTYPE = { '<', '!', 'D', 'O', 'C', 'T', 'Y', 'P', 'E' };
// no END_DOCTYPE because doctype must be parsed
static final private String UNEXPECTED_EOF = "Unexpected EOF";
static final private String ILLEGAL_TYPE = "Wrong event type";
// Internal token type returned by peekType() for "<?xml "; nextImpl() consumes the
// declaration and continues with the following token instead of returning it.
static final private int XML_DECLARATION = 998;
// general
// Value of the "location" property; used in position descriptions when non-null.
private String location;
// Values taken from the XML declaration by readXmlDeclaration().
private String version;
private Boolean standalone;
// Feature flags toggled through setFeature().
private boolean processNsp;
private boolean relaxed;
private boolean keepNamespaceAttributes;
// Entity name -> replacement text; created (with the five predefined entities) by setInput().
private Map<String, String> entityMap;
// Number of currently open elements.
private int depth;
// Open elements in groups of 4: namespace, prefix, local name, qualified name.
private String[] elementStack = new String[16];
// Namespace declarations as (prefix, uri) pairs; a null prefix is the default namespace.
private String[] nspStack = new String[8];
// nspCounts[d] = number of namespace declarations in scope at element depth d.
private int[] nspCounts = new int[4];
// source
private Reader reader;
private String encoding;
private final char[] buffer = new char[8192];
// Index of the next unread character in buffer.
private int position = 0;
// Index one past the last valid character in buffer.
private int limit = 0;
/*
* Track the number of newlines and columns preceding the current buffer. To
* compute the line and column of a position in the buffer, compute the line
* and column in the buffer and add the preceding values.
*/
private int bufferStartLine;
private int bufferStartColumn;
// the current token
private int type;
private boolean isWhitespace;
private String namespace;
private String prefix;
private String name;
private String text;
// True after parsing an empty-element tag ("<a/>"); nextImpl() then synthesizes the END_TAG.
private boolean degenerated;
private int attributeCount;
/*
* The current element's attributes arranged in groups of 4:
* i + 0 = attribute namespace URI
* i + 1 = attribute namespace prefix
* i + 2 = attribute qualified name (may contain ":", as in "html:h1")
* i + 3 = attribute value
*/
private String[] attributes = new String[16];
// Pending message recorded by checkRelaxed() in relaxed mode; nextImpl() reports it as a COMMENT.
private String error;
// Set by readEntity(): true when the last entity reference had no replacement text.
private boolean unresolved;
// True while servicing nextToken(), false while servicing next().
private boolean token;
/**
 * Asks the parser to leave namespace declarations such as {@code xmlns="http://foo"} or
 * {@code xmlns:foo="http:foo"} in the attribute list of each element instead of stripping
 * them. Ordinary clients only care about the resolved namespace of an element and can ignore
 * this; structure-preserving consumers (for example a DOM builder) need the raw declarations.
 */
public void keepNamespaceAttributes() {
    keepNamespaceAttributes = true;
}
/**
 * Tests whether {@code n1} is an xmlpull.org feature or property URI whose fragment
 * equals {@code n2}.
 *
 * <p>The comparison skips a fixed-length prefix: 42 characters for properties
 * ({@code http://xmlpull.org/v1/doc/properties.html#}) and 40 for features
 * ({@code http://xmlpull.org/v1/doc/features.html#}).
 *
 * @param n1 the full URI supplied by the caller
 * @param prop true to treat {@code n1} as a property URI, false for a feature URI
 * @param n2 the expected fragment, e.g. {@code "relaxed"}
 * @return true if {@code n1} has the xmlpull.org prefix and its tail equals {@code n2};
 *     false otherwise, including when {@code n1} is too short to contain a fragment
 */
private boolean isProp(String n1, boolean prop, String n2) {
    if (!n1.startsWith("http://xmlpull.org/v1/doc/")) {
        return false;
    }
    int fragmentStart = prop ? 42 : 40;
    // A URI with the right prefix but shorter than the cut point used to make
    // substring() throw StringIndexOutOfBoundsException; treat it as "no match".
    if (n1.length() < fragmentStart) {
        return false;
    }
    return n1.substring(fragmentStart).equals(n2);
}
/**
 * Applies namespace processing to the start tag that was just parsed.
 *
 * <p>First pass: every {@code xmlns} / {@code xmlns:foo} attribute is pushed onto
 * {@code nspStack} and, unless {@code keepNamespaceAttributes} is set, removed from the
 * attribute list. Second pass (only if needed): prefixed attributes are split into
 * prefix and local name and their namespace is resolved. Finally the element's own
 * {@code name} is split and {@code prefix}/{@code namespace} are set.
 *
 * @return true if any attribute carried a prefix or a namespace declaration was retained
 * @throws XmlPullParserException for namespace errors reported through checkRelaxed()
 *     when the parser is not relaxed
 */
private boolean adjustNsp() throws XmlPullParserException {
boolean any = false;
// Pass 1: collect namespace declarations.
for (int i = 0; i < attributeCount << 2; i += 4) {
String attrName = attributes[i + 2];
int cut = attrName.indexOf(':');
String prefix;
if (cut != -1) {
prefix = attrName.substring(0, cut);
attrName = attrName.substring(cut + 1);
} else if (attrName.equals("xmlns")) {
// default namespace declaration: stored with a null prefix
prefix = attrName;
attrName = null;
} else {
continue;
}
if (!prefix.equals("xmlns")) {
// an ordinary prefixed attribute; resolved in pass 2
any = true;
} else {
// append (prefix, uri) to the declarations of the current depth
int j = (nspCounts[depth]++) << 1;
nspStack = ensureCapacity(nspStack, j + 2);
nspStack[j] = attrName;
nspStack[j + 1] = attributes[i + 3];
if (attrName != null && attributes[i + 3].isEmpty()) {
checkRelaxed("illegal empty namespace");
}
if (keepNamespaceAttributes) {
// explicitly set the namespace for unprefixed attributes
// such as xmlns="http://foo"
attributes[i] = "http://www.w3.org/2000/xmlns/";
any = true;
} else {
// drop this attribute by shifting the following groups down by one
System.arraycopy(
attributes,
i + 4,
attributes,
i,
((--attributeCount) << 2) - i);
// re-examine the group that now occupies slot i
i -= 4;
}
}
}
// Pass 2: resolve prefixes of the remaining attributes.
if (any) {
for (int i = (attributeCount << 2) - 4; i >= 0; i -= 4) {
String attrName = attributes[i + 2];
int cut = attrName.indexOf(':');
if (cut == 0 && !relaxed) {
throw new RuntimeException(
"illegal attribute name: " + attrName + " at " + this);
} else if (cut != -1) {
String attrPrefix = attrName.substring(0, cut);
attrName = attrName.substring(cut + 1);
String attrNs = getNamespace(attrPrefix);
if (attrNs == null && !relaxed) {
throw new RuntimeException(
"Undefined Prefix: " + attrPrefix + " in " + this);
}
attributes[i] = attrNs;
attributes[i + 1] = attrPrefix;
attributes[i + 2] = attrName;
}
}
}
// Finally split and resolve the element name itself.
int cut = name.indexOf(':');
if (cut == 0) {
checkRelaxed("illegal tag name: " + name);
}
if (cut != -1) {
prefix = name.substring(0, cut);
name = name.substring(cut + 1);
}
this.namespace = getNamespace(prefix);
if (this.namespace == null) {
if (prefix != null) {
checkRelaxed("undefined prefix: " + prefix);
}
this.namespace = NO_NAMESPACE;
}
return any;
}
/**
 * Returns an array that can hold at least {@code required} strings. The given array is
 * returned unchanged when it is already large enough; otherwise its contents are copied
 * into a new array with 16 slots of headroom beyond {@code required}.
 */
private String[] ensureCapacity(String[] arr, int required) {
    if (required > arr.length) {
        String[] grown = new String[16 + required];
        System.arraycopy(arr, 0, grown, 0, arr.length);
        arr = grown;
    }
    return arr;
}
/**
 * Reports a well-formedness problem. A strict parser throws; a relaxed parser remembers
 * the first such message in {@code error} and carries on.
 *
 * @throws XmlPullParserException if the parser is not in relaxed mode
 */
private void checkRelaxed(String errorMessage) throws XmlPullParserException {
    if (relaxed) {
        // only the first pending message is kept
        if (error == null) {
            error = "Error: " + errorMessage;
        }
        return;
    }
    throw new XmlPullParserException(errorMessage, this, null);
}
/**
 * Common base for next() and nextToken(): reads a single token from the input and
 * stores its event type in {@code type} together with the matching name/text state.
 *
 * <p>Pending work is delivered before new input is read: first the synthetic END_TAG
 * of an empty-element tag, then any error message recorded in relaxed mode (reported
 * as a COMMENT). An XML declaration is consumed silently and the loop continues with
 * the token that follows it.
 *
 * @throws XmlPullParserException if setInput() has not been called or the input is malformed
 */
private void nextImpl() throws IOException, XmlPullParserException {
if (reader == null) {
throw new XmlPullParserException("setInput() must be called first.", this, null);
}
// the previous END_TAG closed an element; leave its depth now
if (type == END_TAG) {
depth--;
}
while (true) {
attributeCount = -1;
// degenerated needs to be handled before error because of possible
// processor expectations(!)
if (degenerated) {
degenerated = false;
type = END_TAG;
return;
}
// surface a pending relaxed-mode error as a COMMENT token
if (error != null) {
text = error;
error = null;
type = COMMENT;
return;
}
prefix = null;
name = null;
namespace = null;
type = peekType();
switch (type) {
case ENTITY_REF:
// nextToken() reports the entity on its own; next() folds it into text below
if (token) {
StringBuilder entityTextBuilder = new StringBuilder();
readEntity(entityTextBuilder);
text = entityTextBuilder.toString();
return;
}
// fall-through
case TEXT:
// entities are resolved inline only when not in token mode
text = readValue('<', !token, false);
if (depth == 0 && isWhitespace) {
type = IGNORABLE_WHITESPACE;
}
return;
case START_TAG:
text = null; // TODO: fix next()/nextToken() so this is handled there
parseStartTag(false);
return;
case END_TAG:
readEndTag();
return;
case END_DOCUMENT:
return;
case XML_DECLARATION:
// not reported to the caller; read it and look at the next token
readXmlDeclaration();
continue;
case PROCESSING_INSTRUCTION:
read(START_PROCESSING_INSTRUCTION);
if (token) {
text = readUntil(END_PROCESSING_INSTRUCTION, true);
} else {
readUntil(END_PROCESSING_INSTRUCTION, false);
}
return;
case DOCDECL:
readDoctype(token);
return;
case CDSECT:
// keep text accumulated so far so the CDATA content is appended to it
String oldText = text;
read(START_CDATA);
text = readUntil(END_CDATA, true);
if (oldText != null) {
text = oldText + text; // TODO: fix next()/nextToken() so this is handled there
}
return;
case COMMENT:
read(START_COMMENT);
if (token) {
text = readUntil(END_COMMENT, true);
} else {
readUntil(END_COMMENT, false);
}
return;
}
}
}
/**
 * Reads text until the specified delimiter is encountered. Consumes the
 * text and the delimiter.
 *
 * <p>If the input ends before the delimiter is found, a strict parser throws; a relaxed
 * parser records the error, sets {@code type} to COMMENT and returns null.
 *
 * @param delimiter the terminating character sequence, e.g. {@code END_COMMENT}
 * @param returnText true to return the read text excluding the delimiter;
 *     false to return null.
 * @return the text preceding the delimiter, or null
 * @throws XmlPullParserException on unexpected EOF or an illegal {@code --->} comment
 *     terminator when not relaxed
 */
private String readUntil(char[] delimiter, boolean returnText)
        throws IOException, XmlPullParserException {
    int previous = -1;
    int start = position;
    StringBuilder result = null;

    search:
    while (true) {
        // Refill only when fewer than delimiter.length characters remain. Using ">="
        // here forced a refill when exactly enough characters were buffered, which
        // failed with "Unexpected EOF" for a delimiter ending exactly at end of input.
        if (position + delimiter.length > limit) {
            // the refill moves buffer contents, so save what was scanned so far
            if (start < position && returnText) {
                if (result == null) {
                    result = new StringBuilder();
                }
                result.append(buffer, start, position - start);
            }
            if (!fillBuffer(delimiter.length)) {
                checkRelaxed(UNEXPECTED_EOF);
                type = COMMENT;
                return null;
            }
            start = position;
        }

        // TODO: replace with Arrays.equals(buffer, position, delimiter, 0, delimiter.length)
        // when the VM has better method inlining
        for (int i = 0; i < delimiter.length; i++) {
            if (buffer[position + i] != delimiter[i]) {
                previous = buffer[position];
                position++;
                continue search;
            }
        }
        break;
    }

    // "--->" : a comment must not end with a dash directly before "-->"
    if (delimiter == END_COMMENT && previous == '-') {
        checkRelaxed("illegal comment delimiter: --->");
    }

    int end = position;
    position += delimiter.length;

    if (!returnText) {
        return null;
    } else if (result == null) {
        return new String(buffer, start, end - start);
    } else {
        result.append(buffer, start, end - start);
        return result.toString();
    }
}
/**
 * Consumes an XML declaration ({@code <?xml ... ?>}) and records its {@code version},
 * optional {@code encoding} and optional {@code standalone} pseudo-attributes.
 *
 * @return always true once the declaration has been read
 * @throws XmlPullParserException if the declaration is misplaced or malformed and the
 *     parser is not relaxed
 */
private boolean readXmlDeclaration() throws IOException, XmlPullParserException {
    boolean atDocumentStart = bufferStartLine == 0 && bufferStartColumn == 0 && position == 0;
    if (!atDocumentStart) {
        checkRelaxed("processing instructions must not start with xml");
    }

    read(START_PROCESSING_INSTRUCTION);
    // the declaration's pseudo-attributes are parsed like those of a start tag
    parseStartTag(true);

    boolean hasVersion = attributeCount >= 1 && "version".equals(attributes[2]);
    if (!hasVersion) {
        checkRelaxed("version expected");
    }
    version = attributes[3];

    // number of pseudo-attributes recognised so far
    int consumed = 1;

    if (consumed < attributeCount && "encoding".equals(attributes[4 + 2])) {
        encoding = attributes[4 + 3];
        consumed++;
    }

    if (consumed < attributeCount && "standalone".equals(attributes[4 * consumed + 2])) {
        String value = attributes[4 * consumed + 3];
        if ("yes".equals(value)) {
            standalone = Boolean.TRUE;
        } else if ("no".equals(value)) {
            standalone = Boolean.FALSE;
        } else {
            checkRelaxed("illegal standalone value: " + value);
        }
        consumed++;
    }

    if (consumed != attributeCount) {
        checkRelaxed("unexpected attributes in XML declaration");
    }

    isWhitespace = true;
    text = null;
    return true;
}
/**
 * Consumes a {@code <!DOCTYPE ...>} declaration up to its matching {@code >}.
 * Nested {@code <}/{@code >} pairs are counted, and angle brackets between single
 * quotes are ignored.
 *
 * @param assignText true to store the declaration body (without the final {@code >})
 *     in {@code text}
 */
private void readDoctype(boolean assignText) throws IOException, XmlPullParserException {
    read(START_DOCTYPE);

    int start = position;
    StringBuilder collected = null;
    int openBrackets = 1;
    boolean inQuotes = false;

    scan:
    while (true) {
        if (position >= limit) {
            // preserve what has been scanned before the buffer is refilled
            if (start < position && assignText) {
                if (collected == null) {
                    collected = new StringBuilder();
                }
                collected.append(buffer, start, position - start);
            }
            if (!fillBuffer(1)) {
                checkRelaxed(UNEXPECTED_EOF);
                return;
            }
            start = position;
        }

        char c = buffer[position++];
        switch (c) {
            case '\'':
                inQuotes = !inQuotes; // TODO: should this include a double quote as well?
                break;
            case '<':
                if (!inQuotes) {
                    openBrackets++;
                }
                break;
            case '>':
                if (!inQuotes && --openBrackets == 0) {
                    break scan;
                }
                break;
            default:
                break;
        }
    }

    if (!assignText) {
        return;
    }
    int length = position - start - 1; // omit the '>'
    if (collected == null) {
        text = new String(buffer, start, length);
    } else {
        collected.append(buffer, start, length);
        text = collected.toString();
    }
}
/**
 * Consumes an end tag ({@code </name>}). A strict parser verifies that the name matches
 * the innermost open element and restores that element's namespace, prefix and local
 * name; a relaxed parser only records the name that was read.
 *
 * @throws XmlPullParserException if no element is open or the names differ, unless relaxed
 */
private void readEndTag() throws IOException, XmlPullParserException {
    read('<');
    read('/');
    name = readName(); // TODO: pass the expected name in as a hint?
    skip();
    read('>');

    if (depth == 0) {
        checkRelaxed("read end tag " + name + " with no tags open");
        type = COMMENT;
        return;
    }
    if (relaxed) {
        return;
    }

    // slot of the innermost open element on the element stack
    int base = (depth - 1) * 4;
    String expected = elementStack[base + 3];
    if (!name.equals(expected)) {
        throw new XmlPullParserException(
                "expected: /" + expected + " read: " + name, this, null);
    }
    namespace = elementStack[base];
    prefix = elementStack[base + 1];
    name = elementStack[base + 2];
}
/**
 * Looks at the upcoming characters, without consuming them, and classifies the next
 * token.
 *
 * @return the event type of the next token, or {@code XML_DECLARATION}
 * @throws XmlPullParserException for a {@code <} with fewer than two characters after
 *     it, or an unrecognised {@code <!} construct
 */
private int peekType() throws IOException, XmlPullParserException {
    if (position >= limit && !fillBuffer(1)) {
        return END_DOCUMENT;
    }

    char first = buffer[position];
    if (first == '&') {
        return ENTITY_REF;
    }
    if (first != '<') {
        return TEXT;
    }

    // need the two characters after '<' to decide
    if (position + 2 >= limit && !fillBuffer(3)) {
        throw new XmlPullParserException("Dangling <", this, null);
    }

    switch (buffer[position + 1]) {
        case '/':
            return END_TAG;
        case '?': {
            // we're looking for "<?xml " with case insensitivity
            boolean xmlDeclaration = (position + 5 < limit || fillBuffer(6))
                    && (buffer[position + 2] == 'x' || buffer[position + 2] == 'X')
                    && (buffer[position + 3] == 'm' || buffer[position + 3] == 'M')
                    && (buffer[position + 4] == 'l' || buffer[position + 4] == 'L')
                    && (buffer[position + 5] == ' ');
            return xmlDeclaration ? XML_DECLARATION : PROCESSING_INSTRUCTION;
        }
        case '!': {
            // the third character distinguishes <!DOCTYPE, <![CDATA[ and <!--
            char third = buffer[position + 2];
            if (third == START_DOCTYPE[2]) {
                return DOCDECL;
            }
            if (third == START_CDATA[2]) {
                return CDSECT;
            }
            if (third == START_COMMENT[2]) {
                return COMMENT;
            }
            throw new XmlPullParserException("Unexpected <!", this, null);
        }
        default:
            return START_TAG;
    }
}
/**
 * Parses a start tag (or, when {@code xmldecl} is true, the body of an XML declaration
 * whose leading {@code <?} has already been consumed) and sets {@code name},
 * {@code attributes} and {@code attributeCount}.
 *
 * <p>For a real start tag the element is pushed onto the element stack, {@code depth}
 * is incremented and, if namespace processing is enabled, namespaces are resolved.
 * For an XML declaration the method returns right after the closing {@code ?>}
 * without touching the element stack.
 *
 * <p>If the input ends inside the tag, a strict parser throws and a relaxed parser
 * records the error and returns early without pushing the element.
 *
 * @param xmldecl true when parsing the pseudo-attributes of an XML declaration
 * @throws XmlPullParserException if the tag is malformed and the parser is not relaxed
 */
private void parseStartTag(boolean xmldecl) throws IOException, XmlPullParserException {
    if (!xmldecl) {
        read('<');
    }
    name = readName();
    attributeCount = 0;

    while (true) {
        skip();

        if (position >= limit && !fillBuffer(1)) {
            checkRelaxed(UNEXPECTED_EOF);
            return;
        }

        int c = buffer[position];

        if (xmldecl) {
            if (c == '?') {
                position++;
                read('>');
                return;
            }
        } else {
            if (c == '/') {
                // empty-element tag: remember to emit the matching END_TAG
                degenerated = true;
                position++;
                skip();
                read('>');
                break;
            } else if (c == '>') {
                position++;
                break;
            }
        }

        String attrName = readName();

        // reserve one group of four slots: namespace, prefix, name, value
        int i = (attributeCount++) * 4;
        attributes = ensureCapacity(attributes, i + 4);
        attributes[i++] = "";
        attributes[i++] = null;
        attributes[i++] = attrName;

        skip();
        if (position >= limit && !fillBuffer(1)) {
            checkRelaxed(UNEXPECTED_EOF);
            return;
        }

        if (buffer[position] == '=') {
            position++;

            skip();
            if (position >= limit && !fillBuffer(1)) {
                checkRelaxed(UNEXPECTED_EOF);
                return;
            }
            char delimiter = buffer[position];

            if (delimiter == '\'' || delimiter == '"') {
                position++;
            } else if (relaxed) {
                // unquoted value: runs up to whitespace or '>'
                delimiter = ' ';
            } else {
                throw new XmlPullParserException("attr value delimiter missing!", this, null);
            }

            attributes[i] = readValue(delimiter, true, true);

            if (delimiter != ' ') {
                // readValue() also returns at end of input. Blindly skipping the
                // "end quote" then pushed position past limit and made the next
                // fillBuffer() fail with a negative-length array copy.
                if (peekCharacter() != delimiter) {
                    checkRelaxed(UNEXPECTED_EOF);
                    return;
                }
                position++; // end quote
            }
        } else {
            // Attribute without a value. Relaxed parsers silently use the name as
            // the value; strict parsers reject it (checkRelaxed throws here).
            if (!relaxed) {
                checkRelaxed("Attr.value missing f. " + attrName);
            }
            attributes[i] = attrName;
        }
    }

    // push the element: slot +3 holds the qualified name as written
    int sp = depth++ * 4;
    elementStack = ensureCapacity(elementStack, sp + 4);
    elementStack[sp + 3] = name;

    if (depth >= nspCounts.length) {
        int[] bigger = new int[depth + 4];
        System.arraycopy(nspCounts, 0, bigger, 0, nspCounts.length);
        nspCounts = bigger;
    }

    // the new element starts with its parent's namespace declarations in scope
    nspCounts[depth] = nspCounts[depth - 1];

    if (processNsp) {
        adjustNsp();
    } else {
        namespace = "";
    }

    elementStack[sp] = namespace;
    elementStack[sp + 1] = prefix;
    elementStack[sp + 2] = name;
}
/**
 * Reads an entity reference from the buffer, resolves it, and writes the
 * resolved entity to {@code out}. If the entity cannot be read or resolved,
 * {@code out} will contain the partial entity reference (relaxed mode,
 * unterminated reference) or nothing (unknown entity name).
 *
 * <p>Numeric character references ({@code &#N;} and {@code &#xH;}) are decoded as
 * Unicode code points, so characters outside the Basic Multilingual Plane are
 * appended as a surrogate pair. {@code unresolved} is updated for every reference
 * that is read to completion.
 *
 * @param out receives the replacement text
 * @throws XmlPullParserException if the reference is unterminated (strict mode), is a
 *     malformed or out-of-range character reference, or names an unknown entity while
 *     servicing {@code next()} in strict mode
 */
private void readEntity(StringBuilder out) throws IOException, XmlPullParserException {
    int start = out.length();

    if (buffer[position++] != '&') {
        throw new AssertionError();
    }

    out.append('&');

    while (true) {
        int c = peekCharacter();

        if (c == ';') {
            position++;
            break;
        } else if (c >= 128
                || (c >= '0' && c <= '9')
                || (c >= 'a' && c <= 'z')
                || (c >= 'A' && c <= 'Z')
                || c == '_'
                || c == '-'
                || c == '#') {
            position++;
            out.append((char) c);
        } else if (relaxed) {
            // intentionally leave the partial reference in 'out'
            return;
        } else {
            throw new XmlPullParserException("unterminated entity ref", this, null);
        }
    }

    // strip the raw "&name" again; only the replacement text belongs in 'out'
    String code = out.substring(start + 1);
    out.delete(start, out.length());

    if (token && type == ENTITY_REF) {
        name = code;
    }

    // startsWith() instead of charAt(0): "&;" yields an empty code and must not crash
    if (code.startsWith("#")) {
        try {
            int codePoint = code.startsWith("#x")
                    ? Integer.parseInt(code.substring(2), 16)
                    : Integer.parseInt(code.substring(1));
            // appendCodePoint() handles supplementary characters that a (char) cast
            // would truncate, and rejects values that are not valid code points
            out.appendCodePoint(codePoint);
            unresolved = false;
            return;
        } catch (IllegalArgumentException e) {
            // covers NumberFormatException ("&#;", "&#xZZ;") and invalid code points
            throw new XmlPullParserException(
                    "Invalid character reference: &" + code + ";", this, e);
        }
    }

    String resolved = entityMap.get(code);
    if (resolved != null) {
        unresolved = false;
        out.append(resolved);
        return;
    }

    unresolved = true;
    if (!token) {
        checkRelaxed("unresolved: &" + code + ";");
        // TODO: should the &code; show up in the text in relaxed mode?
    }
}
/**
 * Returns the current text or attribute value. This also has the side
 * effect of setting isWhitespace to false if a non-whitespace character is
 * encountered.
 *
 * <p>The delimiter itself is not consumed. If {@code text} is already non-null, the
 * returned string starts with it. When the input ends before a delimiter is found,
 * whatever has been collected so far is returned.
 *
 * @param delimiter {@code <} for text, {@code "} and {@code '} for quoted
 * attributes, or a space for unquoted attributes.
 * @param resolveEntities true to replace entity references with their values; false
 * to stop in front of the first {@code &}.
 * @param inAttributeValue true to apply attribute rules: line breaks become spaces,
 * {@code <} is reported as an error, and {@code ]]>} is not checked.
 * @return the characters read, after line-break normalisation and entity replacement
 */
private String readValue(char delimiter, boolean resolveEntities,
boolean inAttributeValue) throws IOException, XmlPullParserException {
/*
* This method returns all of the characters from the current position
* through to an appropriate delimiter.
*
* If we're lucky (which we usually are), we'll return a single slice of
* the buffer. This fast path avoids allocating a string builder.
*
* There are 5 unlucky characters we could encounter:
* - "&": entities must be resolved.
* - "<": this isn't permitted in attributes unless relaxed.
* - "]": this requires a lookahead to defend against the forbidden
* CDATA section delimiter "]]>".
* - "\r": If a "\r" is followed by a "\n", we discard the "\r". If it
* isn't followed by "\n", we replace "\r" with either a "\n"
* in text nodes or a space in attribute values.
* - "\n": In attribute values, "\n" must be replaced with a space.
*
* We could also get unlucky by needing to refill the buffer midway
* through the text.
*/
int start = position;
StringBuilder result = null;
// if a text section was already started, prefix the start
if (text != null) {
result = new StringBuilder();
result.append(text);
}
while (true) {
/*
* Make sure we have at least a single character to read from the
* buffer. This mutates the buffer, so save the partial result
* to the slow path string builder first.
*/
if (position >= limit) {
if (start < position) {
if (result == null) {
result = new StringBuilder();
}
result.append(buffer, start, position - start);
}
if (!fillBuffer(1)) {
// end of input: return what we have
return result != null ? result.toString() : "";
}
start = position;
}
char c = buffer[position];
// stop at the delimiter; a space delimiter also stops at any whitespace or '>'
if (c == delimiter
|| (delimiter == ' ' && (c <= ' ' || c == '>'))
|| c == '&' && !resolveEntities) {
break;
}
// fast path: an ordinary character just extends the current slice
if (c != '\r'
&& (c != '\n' || !inAttributeValue)
&& c != '&'
&& c != '<'
&& (c != ']' || inAttributeValue)) {
isWhitespace &= (c <= ' ');
position++;
continue;
}
/*
* We've encountered an unlucky character! Convert from fast
* path to slow path if we haven't done so already.
*/
if (result == null) {
result = new StringBuilder();
}
result.append(buffer, start, position - start);
if (c == '\r') {
// swallow the '\n' of a "\r\n" pair so only one line break is emitted
if ((position + 1 < limit || fillBuffer(2)) && buffer[position + 1] == '\n') {
position++;
}
c = inAttributeValue ? ' ' : '\n';
} else if (c == '\n') {
c = ' ';
} else if (c == '&') {
isWhitespace = false; // TODO: what if the entity resolves to whitespace?
readEntity(result);
start = position;
continue;
} else if (c == '<') {
if (inAttributeValue) {
checkRelaxed("Illegal: \"<\" inside attribute value");
}
isWhitespace = false;
} else if (c == ']') {
if ((position + 2 < limit || fillBuffer(3))
&& buffer[position + 1] == ']' && buffer[position + 2] == '>') {
checkRelaxed("Illegal: \"]]>\" outside CDATA section");
}
isWhitespace = false;
} else {
throw new AssertionError();
}
// emit the (possibly substituted) character and start a new slice after it
position++;
result.append(c);
start = position;
}
if (result == null) {
return new String(buffer, start, position - start);
} else {
result.append(buffer, start, position - start);
return result.toString();
}
}
/**
 * Consumes one character, which is expected to be {@code expected}.
 *
 * <p>A mismatch is reported through checkRelaxed(); in relaxed mode the unexpected
 * character is still consumed. At end of input nothing is consumed, so
 * {@code position} never moves past {@code limit}.
 *
 * @param expected the character that should come next
 * @throws XmlPullParserException on mismatch or end of input when not relaxed
 */
private void read(char expected) throws IOException, XmlPullParserException {
    int c = peekCharacter();
    if (c == -1) {
        // Advancing here would leave position > limit and make the next
        // fillBuffer() call fail with a negative-length array copy.
        checkRelaxed("expected: '" + expected + "' but was EOF");
        return;
    }
    if (c != expected) {
        checkRelaxed("expected: '" + expected + "' actual: '" + ((char) c) + "'");
    }
    position++;
}
/**
 * Consumes the character sequence {@code chars}, which is expected to come next in the
 * input.
 *
 * <p>Mismatches are reported through checkRelaxed(); in relaxed mode the same number of
 * characters is consumed regardless. If the input ends first, nothing is consumed.
 *
 * @param chars the expected literal, e.g. {@code START_COMMENT}
 * @throws XmlPullParserException on mismatch or end of input when not relaxed
 */
private void read(char[] chars) throws IOException, XmlPullParserException {
    // Refill only when fewer than chars.length characters are buffered. The former
    // ">=" test asked for more input even when exactly enough was available, which
    // reported a spurious EOF for a literal ending exactly at end of input.
    if (position + chars.length > limit && !fillBuffer(chars.length)) {
        checkRelaxed("expected: '" + new String(chars) + "' but was EOF");
        return;
    }

    // TODO: replace with Arrays.equals(buffer, position, delimiter, 0, delimiter.length)
    // when the VM has better method inlining
    for (int i = 0; i < chars.length; i++) {
        if (buffer[position + i] != chars[i]) {
            checkRelaxed("expected: \"" + new String(chars) + "\" but was \""
                    + new String(buffer, position, chars.length) + "...\"");
        }
    }

    position += chars.length;
}
/**
 * Returns the next character without consuming it, refilling the buffer if necessary.
 *
 * @return the next character, or -1 if the input is exhausted
 */
private int peekCharacter() throws IOException, XmlPullParserException {
    if (position >= limit && !fillBuffer(1)) {
        return -1;
    }
    return buffer[position];
}
/**
 * Returns true once {@code limit - position >= minimum}. If the data is
 * exhausted before that many characters are available, this returns
 * false.
 *
 * <p>Unread characters are moved to the front of the buffer, so {@code position} is 0
 * afterwards and any index into the old buffer contents is invalid. The line/column
 * bookkeeping is advanced over the characters that are discarded.
 *
 * @param minimum the number of characters the caller needs to have buffered
 */
private boolean fillBuffer(int minimum) throws IOException {
    // Before clobbering the old characters, update where buffer starts
    for (int i = 0; i < position; i++) {
        if (buffer[i] == '\n') {
            bufferStartLine++;
            bufferStartColumn = 0;
        } else {
            bufferStartColumn++;
        }
    }

    // slide the unread tail down to index 0
    if (limit != position) {
        limit -= position;
        System.arraycopy(buffer, position, buffer, 0, limit);
    } else {
        limit = 0;
    }

    position = 0;
    int total;
    while ((total = reader.read(buffer, limit, buffer.length - limit)) != -1) {
        limit += total;
        if (limit >= minimum) {
            return true;
        }
    }
    // The reader is exhausted. The request is still satisfied if the characters that
    // were already buffered cover it; previously this case wrongly reported failure.
    return limit >= minimum;
}
/**
 * Reads an element or attribute name starting at the current position. A strict parser
 * never returns an empty name: it throws if no valid name start character is found.
 * A relaxed parser accepts any first character.
 *
 * @return the name; empty only in relaxed mode at end of input
 */
private String readName() throws IOException, XmlPullParserException {
    if (position >= limit && !fillBuffer(1)) {
        checkRelaxed("name expected");
        return "";
    }

    int sliceStart = position;
    StringBuilder collected = null;

    // the first character has a narrower set of legal values
    char c = buffer[position];
    boolean validStart = (c >= 'a' && c <= 'z')
            || (c >= 'A' && c <= 'Z')
            || c == '_'
            || c == ':'
            || c >= '\u00c0' // TODO: check the XML spec
            || relaxed;
    if (!validStart) {
        checkRelaxed("name expected");
        return "";
    }
    position++;

    for (;;) {
        /*
         * A refill moves the buffer contents, so stash the part of the name
         * scanned so far before asking for more input.
         */
        if (position >= limit) {
            if (collected == null) {
                collected = new StringBuilder();
            }
            collected.append(buffer, sliceStart, position - sliceStart);
            if (!fillBuffer(1)) {
                return collected.toString();
            }
            sliceStart = position;
        }

        c = buffer[position];
        boolean namePart = (c >= 'a' && c <= 'z')
                || (c >= 'A' && c <= 'Z')
                || (c >= '0' && c <= '9')
                || c == '_'
                || c == '-'
                || c == ':'
                || c == '.'
                || c >= '\u00b7'; // TODO: check the XML spec
        if (!namePart) {
            break;
        }
        position++;
    }

    // first non-name character reached: hand back the slice (plus any stashed prefix)
    if (collected == null) {
        return new String(buffer, sliceStart, position - sliceStart);
    }
    collected.append(buffer, sliceStart, position - sliceStart);
    return collected.toString();
}
/**
 * Advances past characters whose value is at most that of a space, stopping at the
 * first character above it or at end of input.
 */
private void skip() throws IOException {
    while (true) {
        if (position >= limit && !fillBuffer(1)) {
            return;
        }
        if (buffer[position] > ' ') {
            return;
        }
        position++;
    }
}
// public part starts here...
/**
 * Sets the character source and resets the parser to the start-of-document state.
 * Passing null only detaches the reader and clears the token state; buffer position,
 * depth and the entity table are reset only for a non-null reader.
 *
 * @param reader the source to parse, or null
 */
public void setInput(Reader reader) throws XmlPullParserException {
    this.reader = reader;

    // forget everything about the previous document's current token
    type = START_DOCUMENT;
    name = null;
    namespace = null;
    degenerated = false;
    attributeCount = -1;

    // forget the previous XML declaration
    encoding = null;
    version = null;
    standalone = null;

    if (reader == null) {
        return;
    }

    position = 0;
    limit = 0;
    bufferStartLine = 0;
    bufferStartColumn = 0;
    depth = 0;

    // the five predefined XML entities
    Map<String, String> predefined = new HashMap<String, String>();
    predefined.put("amp", "&");
    predefined.put("apos", "'");
    predefined.put("gt", ">");
    predefined.put("lt", "<");
    predefined.put("quot", "\"");
    entityMap = predefined;
}
/**
 * Sets a byte stream as the input source.
 *
 * <p>If {@code _enc} is null, the encoding is guessed from the first four bytes (byte
 * order mark, or the byte pattern of a leading {@code <} / {@code <?}) and, for
 * ASCII-compatible input starting with {@code <?xm}, from the {@code encoding}
 * pseudo-attribute of the XML declaration. If nothing can be determined, UTF-8 is
 * used. Characters that were consumed while sniffing are kept in the buffer so that
 * parsing starts at the beginning of the document.
 *
 * <p>{@link #getInputEncoding()} afterwards reports the encoding actually used to
 * decode the stream, i.e. {@code _enc} if given, otherwise the detected or default one.
 *
 * @param is the stream to read; must not be null
 * @param _enc the character encoding, or null to auto-detect
 * @throws IllegalArgumentException if {@code is} is null
 * @throws XmlPullParserException if the stream cannot be read or the encoding is
 *     unsupported
 */
public void setInput(InputStream is, String _enc) throws XmlPullParserException {
    position = 0;
    limit = 0;
    String enc = _enc;

    if (is == null) {
        throw new IllegalArgumentException();
    }

    try {
        if (enc == null) {
            // read the four bytes looking for an indication of the encoding in use
            int firstFourBytes = 0;
            while (limit < 4) {
                int i = is.read();
                if (i == -1) {
                    break;
                }
                firstFourBytes = (firstFourBytes << 8) | i;
                buffer[limit++] = (char) i;
            }

            if (limit == 4) {
                switch (firstFourBytes) {
                    case 0x00000FEFF: // UTF-32BE BOM
                        enc = "UTF-32BE";
                        limit = 0;
                        break;

                    case 0x0FFFE0000: // UTF-32LE BOM
                        enc = "UTF-32LE";
                        limit = 0;
                        break;

                    case 0x0000003c: // '<' in UTF-32BE
                        enc = "UTF-32BE";
                        buffer[0] = '<';
                        limit = 1;
                        break;

                    case 0x03c000000: // '<' in UTF-32LE
                        enc = "UTF-32LE";
                        buffer[0] = '<';
                        limit = 1;
                        break;

                    case 0x0003c003f: // "<?" in UTF-16BE
                        enc = "UTF-16BE";
                        buffer[0] = '<';
                        buffer[1] = '?';
                        limit = 2;
                        break;

                    case 0x03c003f00: // "<?" in UTF-16LE
                        enc = "UTF-16LE";
                        buffer[0] = '<';
                        buffer[1] = '?';
                        limit = 2;
                        break;

                    case 0x03c3f786d: // "<?xm" in ASCII etc.
                        // read the rest of the declaration byte-wise and look for
                        // its encoding pseudo-attribute
                        while (true) {
                            int i = is.read();
                            if (i == -1) {
                                break;
                            }
                            buffer[limit++] = (char) i;
                            if (i == '>') {
                                String s = new String(buffer, 0, limit);
                                int i0 = s.indexOf("encoding");
                                if (i0 != -1) {
                                    while (s.charAt(i0) != '"'
                                            && s.charAt(i0) != '\'') {
                                        i0++;
                                    }
                                    char deli = s.charAt(i0++);
                                    int i1 = s.indexOf(deli, i0);
                                    enc = s.substring(i0, i1);
                                }
                                break;
                            }
                        }
                        // None of the BOM patterns below can match "<?xm", so the
                        // former implicit fall-through into default was a no-op.
                        break;

                    default:
                        // handle a byte order mark followed by something other than <?
                        if ((firstFourBytes & 0x0ffff0000) == 0x0FEFF0000) {
                            enc = "UTF-16BE";
                            buffer[0] = (char) ((buffer[2] << 8) | buffer[3]);
                            limit = 1;
                        } else if ((firstFourBytes & 0x0ffff0000) == 0x0fffe0000) {
                            enc = "UTF-16LE";
                            buffer[0] = (char) ((buffer[3] << 8) | buffer[2]);
                            limit = 1;
                        } else if ((firstFourBytes & 0x0ffffff00) == 0x0EFBBBF00) {
                            enc = "UTF-8";
                            buffer[0] = buffer[3];
                            limit = 1;
                        }
                }
            }
        }

        if (enc == null) {
            enc = "UTF-8";
        }

        // setInput(Reader) resets limit; keep the characters buffered while sniffing
        int sc = limit;
        setInput(new InputStreamReader(is, enc));
        // Report the encoding actually in use. Storing the _enc argument here lost
        // the detected encoding whenever auto-detection was requested.
        encoding = enc;
        limit = sc;
    } catch (Exception e) {
        throw new XmlPullParserException("Invalid stream or encoding: " + e, this, e);
    }
}
/**
 * Reports the state of a parser feature. Only namespace processing and the xmlpull.org
 * "relaxed" feature are known; every other feature is reported as off.
 */
public boolean getFeature(String feature) {
    if (XmlPullParser.FEATURE_PROCESS_NAMESPACES.equals(feature)) {
        return processNsp;
    }
    if (isProp(feature, false, "relaxed")) {
        return relaxed;
    }
    return false;
}
/** Returns the recorded input encoding, or null if none has been recorded. */
public String getInputEncoding() {
    return this.encoding;
}
/**
 * Registers (or overrides) the replacement text for an entity name. The entity table is
 * created by setInput(), so this must be called afterwards.
 *
 * @throws RuntimeException if no entity table exists yet
 */
public void defineEntityReplacementText(String entity, String value)
        throws XmlPullParserException {
    Map<String, String> entities = entityMap;
    if (entities == null) {
        throw new RuntimeException("entity replacement text must be defined after setInput!");
    }
    entities.put(entity, value);
}
/**
 * Returns the value of an xmlpull.org property.
 *
 * <ul>
 * <li>{@code xmldecl-version}: the version from the XML declaration
 * <li>{@code xmldecl-standalone}: the standalone flag from the XML declaration
 * <li>{@code location}: the location set through setProperty(), otherwise the
 *     string form of the current reader, or null if no input has been set
 * </ul>
 *
 * @return the property value, or null if the property is unknown or has no value
 */
public Object getProperty(String property) {
    if (isProp(property, true, "xmldecl-version")) {
        return version;
    }
    if (isProp(property, true, "xmldecl-standalone")) {
        return standalone;
    }
    if (isProp(property, true, "location")) {
        if (location != null) {
            return location;
        }
        // reader is null until setInput() is called; avoid a NullPointerException
        return reader != null ? reader.toString() : null;
    }
    return null;
}
/**
 * Returns the number of namespace declarations in scope at the given element depth.
 *
 * @throws IndexOutOfBoundsException if {@code depth} exceeds the current depth
 */
public int getNamespaceCount(int depth) {
    if (depth <= this.depth) {
        return nspCounts[depth];
    }
    throw new IndexOutOfBoundsException();
}
/** Returns the prefix of the namespace declaration at index {@code pos} of the namespace stack. */
public String getNamespacePrefix(int pos) {
    int prefixSlot = pos * 2;
    return nspStack[prefixSlot];
}
/** Returns the URI of the namespace declaration at index {@code pos} of the namespace stack. */
public String getNamespaceUri(int pos) {
    int uriSlot = (pos * 2) + 1;
    return nspStack[uriSlot];
}
/**
 * Resolves a namespace prefix against the declarations currently in scope, innermost
 * first. The prefixes {@code xml} and {@code xmlns} are always bound to their fixed URIs.
 *
 * @param prefix the prefix to resolve, or null for the default namespace
 * @return the namespace URI, or null if the prefix is not bound
 */
public String getNamespace(String prefix) {
    if ("xml".equals(prefix)) {
        return "http://www.w3.org/XML/1998/namespace";
    }
    if ("xmlns".equals(prefix)) {
        return "http://www.w3.org/2000/xmlns/";
    }

    // walk the (prefix, uri) pairs from the most recent declaration backwards
    for (int i = (getNamespaceCount(depth) << 1) - 2; i >= 0; i -= 2) {
        String declared = nspStack[i];
        boolean matches = (prefix == null) ? declared == null : prefix.equals(declared);
        if (matches) {
            return nspStack[i + 1];
        }
    }
    return null;
}
/** Returns the current element nesting depth. */
public int getDepth() {
    return this.depth;
}
/**
 * Builds a human-readable description of the current token and its position, in the form
 * {@code TYPE details@line:column in source}. Tags are rendered with their attributes,
 * text is truncated to 16 characters.
 */
public String getPositionDescription() {
    String typeName = type < TYPES.length ? TYPES[type] : "unknown";
    StringBuilder description = new StringBuilder(typeName);
    description.append(' ');

    boolean isTag = type == START_TAG || type == END_TAG;
    if (isTag) {
        if (degenerated) {
            description.append("(empty) ");
        }
        description.append('<');
        if (type == END_TAG) {
            description.append('/');
        }
        if (prefix != null) {
            description.append('{').append(namespace).append('}').append(prefix).append(':');
        }
        description.append(name);

        int end = attributeCount * 4;
        for (int i = 0; i < end; i += 4) {
            description.append(' ');
            if (attributes[i + 1] != null) {
                description.append('{').append(attributes[i]).append('}')
                        .append(attributes[i + 1]).append(':');
            }
            description.append(attributes[i + 2]).append("='")
                    .append(attributes[i + 3]).append('\'');
        }
        description.append('>');
    } else if (type == IGNORABLE_WHITESPACE) {
        // nothing to add for ignorable whitespace
    } else if (type != TEXT) {
        description.append(getText());
    } else if (isWhitespace) {
        description.append("(whitespace)");
    } else {
        String shown = getText();
        if (shown.length() > 16) {
            shown = shown.substring(0, 16) + "...";
        }
        description.append(shown);
    }

    description.append('@').append(getLineNumber()).append(':').append(getColumnNumber());

    if (location != null) {
        description.append(" in ").append(location);
    } else if (reader != null) {
        description.append(" in ").append(reader.toString());
    }
    return description.toString();
}
/**
 * Returns the 1-based line number of the current position: lines before the buffer plus
 * newlines in the consumed part of the buffer.
 */
public int getLineNumber() {
    int line = bufferStartLine + 1; // the first line is '1'
    for (int i = 0; i < position; i++) {
        if (buffer[i] == '\n') {
            line++;
        }
    }
    return line;
}
/**
 * Returns the 1-based column number of the current position, counted from the last
 * newline seen (either before the buffer or in its consumed part).
 */
public int getColumnNumber() {
    int column = bufferStartColumn;
    for (int i = 0; i < position; i++) {
        // a newline restarts the count; anything else advances it
        column = (buffer[i] == '\n') ? 0 : column + 1;
    }
    return column + 1; // the first column is '1'
}
/**
 * Reports whether the current text token consists solely of whitespace.
 *
 * @throws XmlPullParserException if the current event is not TEXT, IGNORABLE_WHITESPACE
 *     or CDSECT
 */
public boolean isWhitespace() throws XmlPullParserException {
    boolean textual = type == TEXT || type == IGNORABLE_WHITESPACE || type == CDSECT;
    if (textual) {
        return isWhitespace;
    }
    throw new XmlPullParserException(ILLEGAL_TYPE, this, null);
}
/**
 * Returns the text of the current token. Null is returned for event types ordered
 * before TEXT and for an entity reference that could not be resolved; otherwise the
 * text, or the empty string if none was recorded.
 */
public String getText() {
    boolean hasNoText = type < TEXT || (type == ENTITY_REF && unresolved);
    if (hasNoText) {
        return null;
    }
    return text != null ? text : "";
}
/**
 * Returns the current text as a fresh character array.
 *
 * @param poslen receives the start offset in slot 0 and the length in slot 1; both are
 *     set to -1 when there is no text
 * @return the characters, or null when {@link #getText()} is null
 */
public char[] getTextCharacters(int[] poslen) {
    String current = getText();
    if (current != null) {
        char[] chars = current.toCharArray();
        poslen[0] = 0;
        poslen[1] = chars.length;
        return chars;
    }
    poslen[0] = -1;
    poslen[1] = -1;
    return null;
}
/** Returns the namespace recorded for the current token. */
public String getNamespace() {
    return this.namespace;
}
/** Returns the name recorded for the current token. */
public String getName() {
    return this.name;
}
/** Returns the namespace prefix recorded for the current token. */
public String getPrefix() {
    return this.prefix;
}
/**
 * Reports whether the current start tag was written as an empty-element tag
 * ({@code <a/>}).
 *
 * @throws XmlPullParserException if the current event is not START_TAG
 */
public boolean isEmptyElementTag() throws XmlPullParserException {
    if (type == START_TAG) {
        return degenerated;
    }
    throw new XmlPullParserException(ILLEGAL_TYPE, this, null);
}
/** Returns the attribute count of the current token; -1 when no tag has been parsed for it. */
public int getAttributeCount() {
    return this.attributeCount;
}
/** Always reports {@code "CDATA"}; the index is not inspected. */
public String getAttributeType(int index) {
    final String type = "CDATA";
    return type;
}
/** Always reports false; the index is not inspected. */
public boolean isAttributeDefault(int index) {
    final boolean defaulted = false;
    return defaulted;
}
/**
 * Returns the namespace URI of the attribute at {@code index}.
 *
 * @throws IndexOutOfBoundsException if {@code index} is not below the attribute count
 */
public String getAttributeNamespace(int index) {
    if (index < attributeCount) {
        return attributes[index * 4];
    }
    throw new IndexOutOfBoundsException();
}
/**
 * Returns the name of the attribute at {@code index}.
 *
 * @throws IndexOutOfBoundsException if {@code index} is not below the attribute count
 */
public String getAttributeName(int index) {
    if (index < attributeCount) {
        return attributes[(index * 4) + 2];
    }
    throw new IndexOutOfBoundsException();
}
/**
 * Returns the namespace prefix of the attribute at {@code index}.
 *
 * @throws IndexOutOfBoundsException if {@code index} is not below the attribute count
 */
public String getAttributePrefix(int index) {
    if (index < attributeCount) {
        return attributes[(index * 4) + 1];
    }
    throw new IndexOutOfBoundsException();
}
/**
 * Returns the value of the attribute at {@code index}.
 *
 * @throws IndexOutOfBoundsException if {@code index} is not below the attribute count
 */
public String getAttributeValue(int index) {
    if (index < attributeCount) {
        return attributes[(index * 4) + 3];
    }
    throw new IndexOutOfBoundsException();
}
/**
 * Looks up an attribute value by name, searching from the last attribute to the first.
 *
 * @param namespace the required namespace URI, or null to match any namespace
 * @param name the attribute name to match
 * @return the value of the first match, or null if there is none
 */
public String getAttributeValue(String namespace, String name) {
    for (int index = attributeCount - 1; index >= 0; index--) {
        int base = index * 4;
        if (!attributes[base + 2].equals(name)) {
            continue;
        }
        if (namespace == null || attributes[base].equals(namespace)) {
            return attributes[base + 3];
        }
    }
    return null;
}
/** Returns the type of the current event. */
public int getEventType() throws XmlPullParserException {
    return this.type;
}
/**
 * Advances to the next high-level event. Low-level tokens read by nextImpl() are skipped
 * or merged: tokens ordered after ENTITY_REF are ignored, and consecutive text-like
 * tokens are combined and reported as a single TEXT event.
 *
 * @return the type of the new current event
 */
public int next() throws XmlPullParserException, IOException {
    token = false;
    text = null;
    isWhitespace = true;

    // smallest token type seen so far
    int lowest = 9999;
    while (true) {
        nextImpl();
        lowest = Math.min(lowest, type);
        if (lowest > ENTITY_REF) {
            continue; // ignorable
        }
        if (lowest >= TEXT && peekType() >= TEXT) {
            continue; // more text follows; keep accumulating
        }
        break;
    }

    // anything text-like is reported as plain TEXT
    type = Math.min(lowest, TEXT);
    return type;
}
/**
 * Advances to the next low-level token exactly as read by nextImpl(), without merging
 * or skipping.
 *
 * @return the type of the new current token
 */
public int nextToken() throws XmlPullParserException, IOException {
    token = true;
    text = null;
    isWhitespace = true;
    nextImpl();
    return this.type;
}
// utility methods to make XML parsing easier ...
/**
 * Advances to the next start or end tag, skipping at most one whitespace-only TEXT event
 * on the way.
 *
 * @return START_TAG or END_TAG
 * @throws XmlPullParserException if the event reached is neither a start nor an end tag
 */
public int nextTag() throws XmlPullParserException, IOException {
    next();
    boolean blankText = type == TEXT && isWhitespace;
    if (blankText) {
        next();
    }
    if (type == END_TAG || type == START_TAG) {
        return type;
    }
    throw new XmlPullParserException("unexpected type", this, null);
}
/**
 * Asserts that the current event has the given type and, where non-null, the given
 * namespace and name.
 *
 * @param type the required event type
 * @param namespace the required namespace, or null to accept any
 * @param name the required name, or null to accept any
 * @throws XmlPullParserException if the current event does not match
 */
public void require(int type, String namespace, String name)
        throws XmlPullParserException, IOException {
    boolean matches = type == this.type
            && (namespace == null || namespace.equals(getNamespace()))
            && (name == null || name.equals(getName()));
    if (matches) {
        return;
    }
    throw new XmlPullParserException(
            "expected: " + TYPES[type] + " {" + namespace + "}" + name, this, null);
}
/**
 * Reads the text content of the current element and leaves the parser on its end tag.
 * Must be called while positioned on a START_TAG.
 *
 * @return the element's text, or the empty string if the element has no text
 * @throws XmlPullParserException if the current event is not START_TAG, or the element
 *     content is not followed directly by its END_TAG
 */
public String nextText() throws XmlPullParserException, IOException {
    if (type != START_TAG) {
        throw new XmlPullParserException("precondition: START_TAG", this, null);
    }

    next();

    String content = "";
    if (type == TEXT) {
        content = getText();
        next();
    }

    if (type != END_TAG) {
        throw new XmlPullParserException("END_TAG expected", this, null);
    }
    return content;
}
/**
 * Switches a parser feature on or off. Supported are namespace processing and the
 * xmlpull.org "relaxed" feature.
 *
 * @throws XmlPullParserException if the feature is not supported
 */
public void setFeature(String feature, boolean value) throws XmlPullParserException {
    if (XmlPullParser.FEATURE_PROCESS_NAMESPACES.equals(feature)) {
        processNsp = value;
        return;
    }
    // "http://xmlpull.org/v1/doc/features.html#relaxed"
    if (isProp(feature, false, "relaxed")) {
        relaxed = value;
        return;
    }
    throw new XmlPullParserException("unsupported feature: " + feature, this, null);
}
/**
 * Sets a parser property. Only the xmlpull.org "location" property is supported; its
 * value is stored in string form.
 *
 * @throws XmlPullParserException if the property is not supported
 */
public void setProperty(String property, Object value) throws XmlPullParserException {
    if (!isProp(property, true, "location")) {
        throw new XmlPullParserException("unsupported property: " + property);
    }
    location = String.valueOf(value);
}
}