/**************************************************************************** ** $Id$ ** ** Implementation of QXmlSimpleReader and related classes. ** ** Created : 000518 ** ** Copyright (C) 1992-2000 Trolltech AS. All rights reserved. ** ** This file is part of the XML module of the Qt GUI Toolkit. ** ** This file may be distributed under the terms of the Q Public License ** as defined by Trolltech AS of Norway and appearing in the file ** LICENSE.QPL included in the packaging of this file. ** ** This file may be distributed and/or modified under the terms of the ** GNU General Public License version 2 as published by the Free Software ** Foundation and appearing in the file LICENSE.GPL included in the ** packaging of this file. ** ** Licensees holding valid Qt Enterprise Edition licenses may use this ** file in accordance with the Qt Commercial License Agreement provided ** with the Software. ** ** This file is provided AS IS with NO WARRANTY OF ANY KIND, INCLUDING THE ** WARRANTY OF DESIGN, MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE. ** ** See http://www.trolltech.com/pricing.html or email sales@trolltech.com for ** information about Qt Commercial License Agreements. ** See http://www.trolltech.com/qpl/ for QPL licensing information. ** See http://www.trolltech.com/gpl/ for GPL licensing information. ** ** Contact info@trolltech.com if any conditions of this licensing are ** not clear to you. ** **********************************************************************/ /****************************************** * DOM support is disabled in QT 2.3.7 for sharp zaurus. * Because of that we copied the code from 2.3.7 into qtcompat and enabled it * there. * Copyright (c) 2004 Ulf Schenk * * $Id$ ******************************************/ #define QT_XML_CPP #include "qxml.h" #include "qtextcodec.h" #include "qbuffer.h" //US #ifndef QT_NO_XML // NOT REVISED // Error strings for the XML reader #define XMLERR_OK "no error occured" #define XMLERR_TAGMISMATCH "tag mismatch" #define XMLERR_UNEXPECTEDEOF "unexpected end of file" #define XMLERR_FINISHEDPARSINGWHILENOTEOF "parsing is finished but end of file is not reached" #define XMLERR_LETTEREXPECTED "letter is expected" #define XMLERR_ERRORPARSINGELEMENT "error while parsing element" #define XMLERR_ERRORPARSINGPROLOG "error while parsing prolog" #define XMLERR_ERRORPARSINGMAINELEMENT "error while parsing main element" #define XMLERR_ERRORPARSINGCONTENT "error while parsing content" #define XMLERR_ERRORPARSINGNAME "error while parsing name" #define XMLERR_ERRORPARSINGNMTOKEN "error while parsing Nmtoken" #define XMLERR_ERRORPARSINGATTRIBUTE "error while parsing attribute" #define XMLERR_ERRORPARSINGMISC "error while parsing misc" #define XMLERR_ERRORPARSINGCHOICE "error while parsing choice or seq" #define XMLERR_ERRORBYCONSUMER "error triggered by consumer" #define XMLERR_UNEXPECTEDCHARACTER "unexpected character" #define XMLERR_EQUALSIGNEXPECTED "expected '=' but not found" #define XMLERR_QUOTATIONEXPECTED "expected \" or ' but not found" #define XMLERR_ERRORPARSINGREFERENCE "error while parsing reference" #define XMLERR_ERRORPARSINGPI "error while parsing processing instruction" #define XMLERR_ERRORPARSINGATTLISTDECL "error while parsing attribute list declaration" #define XMLERR_ERRORPARSINGATTTYPE "error while parsing attribute type declaration" #define XMLERR_ERRORPARSINGATTVALUE "error while parsing attribute value declaration" #define XMLERR_ERRORPARSINGELEMENTDECL "error while parsing element declaration" #define XMLERR_ERRORPARSINGENTITYDECL "error while parsing entity declaration" #define XMLERR_ERRORPARSINGNOTATIONDECL "error while parsing notation declaration" #define XMLERR_ERRORPARSINGEXTERNALID "error while parsing external id" #define XMLERR_ERRORPARSINGCOMMENT "error while parsing comment" #define XMLERR_ERRORPARSINGENTITYVALUE "error while parsing entity value declaration" #define XMLERR_CDSECTHEADEREXPECTED "expected the header for a cdata section" #define XMLERR_MORETHANONEDOCTYPE "more than one document type definition" #define XMLERR_ERRORPARSINGDOCTYPE "error while parsing document type definition" #define XMLERR_INVALIDNAMEFORPI "invalid name for processing instruction" #define XMLERR_VERSIONEXPECTED "version expected while reading the XML declaration" #define XMLERR_EDECLORSDDECLEXPECTED "EDecl or SDDecl expected while reading the XML declaration" #define XMLERR_SDDECLEXPECTED "SDDecl expected while reading the XML declaration" #define XMLERR_WRONGVALUEFORSDECL "wrong value for standalone declaration" #define XMLERR_UNPARSEDENTITYREFERENCE "unparsed entity reference in wrong context" #define XMLERR_INTERNALGENERALENTITYINDTD "internal general entity reference not allowed in DTD" #define XMLERR_EXTERNALGENERALENTITYINDTD "external parsed general entity reference not allowed in DTD" #define XMLERR_EXTERNALGENERALENTITYINAV "external parsed general entity reference not allowed in attribute value" // the constants for the lookup table static const signed char cltWS = 0; // white space static const signed char cltPer = 1; // % static const signed char cltAmp = 2; // & static const signed char cltGt = 3; // > static const signed char cltLt = 4; // < static const signed char cltSlash = 5; // / static const signed char cltQm = 6; // ? static const signed char cltEm = 7; // ! static const signed char cltDash = 8; // - static const signed char cltCB = 9; // ] static const signed char cltOB = 10; // [ static const signed char cltEq = 11; // = static const signed char cltDq = 12; // " static const signed char cltSq = 13; // ' static const signed char cltUnknown = 14; // character lookup table static const signed char charLookupTable[256]={ cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, // 0x00 - 0x07 cltUnknown, // 0x08 cltWS, // 0x09 \t cltWS, // 0x0A \n cltUnknown, // 0x0B cltUnknown, // 0x0C cltWS, // 0x0D \r cltUnknown, // 0x0E cltUnknown, // 0x0F cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, // 0x17 - 0x16 cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, // 0x18 - 0x1F cltWS, // 0x20 Space cltEm, // 0x21 ! cltDq, // 0x22 " cltUnknown, // 0x23 cltUnknown, // 0x24 cltPer, // 0x25 % cltAmp, // 0x26 & cltSq, // 0x27 ' cltUnknown, // 0x28 cltUnknown, // 0x29 cltUnknown, // 0x2A cltUnknown, // 0x2B cltUnknown, // 0x2C cltDash, // 0x2D - cltUnknown, // 0x2E cltSlash, // 0x2F / cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, // 0x30 - 0x37 cltUnknown, // 0x38 cltUnknown, // 0x39 cltUnknown, // 0x3A cltUnknown, // 0x3B cltLt, // 0x3C < cltEq, // 0x3D = cltGt, // 0x3E > cltQm, // 0x3F ? cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, // 0x40 - 0x47 cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, // 0x48 - 0x4F cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, // 0x50 - 0x57 cltUnknown, // 0x58 cltUnknown, // 0x59 cltUnknown, // 0x5A cltOB, // 0x5B [ cltUnknown, // 0x5C cltCB, // 0x5D ] cltUnknown, // 0x5E cltUnknown, // 0x5F cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, // 0x60 - 0x67 cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, // 0x68 - 0x6F cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, // 0x70 - 0x77 cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, // 0x78 - 0x7F cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, // 0x80 - 0x87 cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, // 0x88 - 0x8F cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, // 0x90 - 0x97 cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, // 0x98 - 0x9F cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, // 0xA0 - 0xA7 cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, // 0xA8 - 0xAF cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, // 0xB0 - 0xB7 cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, // 0xB8 - 0xBF cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, // 0xC0 - 0xC7 cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, // 0xC8 - 0xCF cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, // 0xD0 - 0xD7 cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, // 0xD8 - 0xDF cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, // 0xE0 - 0xE7 cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, // 0xE8 - 0xEF cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, // 0xF0 - 0xF7 cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown, cltUnknown // 0xF8 - 0xFF }; class QXmlNamespaceSupportPrivate { }; class QXmlAttributesPrivate { }; class QXmlInputSourcePrivate { }; class QXmlParseExceptionPrivate { }; class QXmlLocatorPrivate { }; class QXmlDefaultHandlerPrivate { }; #if defined(Q_FULL_TEMPLATE_INSTANTIATION) bool operator==( const QMap<QString, QString>, const QMap<QString, QString> ) { return FALSE; } #endif /*! \class QXmlParseException qxml.h \brief The QXmlParseException class is used to report errors with the QXmlErrorHandler interface. \module XML \sa QXmlErrorHandler */ /*! \fn QXmlParseException::QXmlParseException( const QString& name, int c, int l, const QString& p, const QString& s ) Constructs a parse exception with the error string \a name in the column \a c and line \a l for the public identifier \a p and the system identifier \a s. */ /*! Returns the error message. */ QString QXmlParseException::message() const { return msg; } /*! Returns the column number the error occured. */ int QXmlParseException::columnNumber() const { return column; } /*! Returns the line number the error occured. */ int QXmlParseException::lineNumber() const { return line; } /*! Returns the public identifier the error occured. */ QString QXmlParseException::publicId() const { return pub; } /*! Returns the system identifier the error occured. */ QString QXmlParseException::systemId() const { return sys; } /*! \class QXmlLocator qxml.h \brief The QXmlLocator class provides the XML handler classes with information about the actual parsing position. \module XML The reader reports a QXmlLocator to the content handler before he starts to parse the document. This is done with the QXmlContentHandler::setDocumentLocator() function. The handler classes can now use this locator to get the actual position the reader is at. */ /*! \fn QXmlLocator::QXmlLocator( QXmlSimpleReader* parent ) Constructor. */ /*! \fn QXmlLocator::~QXmlLocator() Destructor. */ /*! Gets the column number (starting with 1) or -1 if there is no column number available. */ int QXmlLocator::columnNumber() { return ( reader->columnNr == -1 ? -1 : reader->columnNr + 1 ); } /*! Gets the line number (starting with 1) or -1 if there is no line number available. */ int QXmlLocator::lineNumber() { return ( reader->lineNr == -1 ? -1 : reader->lineNr + 1 ); } /********************************************* * * QXmlNamespaceSupport * *********************************************/ /*! \class QXmlNamespaceSupport qxml.h \brief The QXmlNamespaceSupport class is a helper class for XML readers which want to include namespace support. \module XML It provides some functions that makes it easy to handle namespaces. Its main use is for subclasses of QXmlReader which want to provide namespace support. See also the <a href="xml-sax.html#namespaces">namespace description</a>. */ /*! Constructs a QXmlNamespaceSupport. */ QXmlNamespaceSupport::QXmlNamespaceSupport() { reset(); } /*! Destructs a QXmlNamespaceSupport. */ QXmlNamespaceSupport::~QXmlNamespaceSupport() { } /*! This function declares a prefix in the current namespace context; the prefix will remain in force until this context is popped, unless it is shadowed in a descendant context. Note that there is an asymmetry in this library: while prefix() will not return the default "" prefix, even if you have declared one; to check for a default prefix, you have to look it up explicitly using uri(). This asymmetry exists to make it easier to look up prefixes for attribute names, where the default prefix is not allowed. */ void QXmlNamespaceSupport::setPrefix( const QString& pre, const QString& uri ) { if( pre.isNull() ) { ns.insert( "", uri ); } else { ns.insert( pre, uri ); } } /*! Returns one of the prefixes mapped to a namespace URI. If more than one prefix is currently mapped to the same URI, this function will make an arbitrary selection; if you want all of the prefixes, use the prefixes() function instead. Note: this will never return the empty (default) prefix; to check for a default prefix, use the uri() function with an argument of "". */ QString QXmlNamespaceSupport::prefix( const QString& uri ) const { QMap<QString, QString>::ConstIterator itc, it = ns.begin(); while ( (itc=it) != ns.end() ) { ++it; if ( itc.data() == uri && !itc.key().isEmpty() ) return itc.key(); } return ""; } /*! Looks up a prefix in the current context and returns the currently-mapped namespace URI. Use the empty string ("") for the default namespace. */ QString QXmlNamespaceSupport::uri( const QString& prefix ) const { const QString& returi = ns[ prefix ]; return returi; } /*! Splits the name at the ':' and returns the prefix and the local name. */ void QXmlNamespaceSupport::splitName( const QString& qname, QString& prefix, QString& localname ) const { uint pos; // search the ':' for( pos=0; pos<qname.length(); pos++ ) { if ( qname.at(pos) == ':' ) break; } // and split prefix = qname.left( pos ); localname = qname.mid( pos+1 ); } /*! Processes a raw XML 1.0 name in the current context by removing the prefix and looking it up among the prefixes currently declared. First parameter is the raw XML 1.0 name to be processed. The second parameter is a flag wheter the name is the name of an attribute (TRUE) or not (FALSE). The return values will be stored in the last two parameters as follows: <ul> <li> The namespace URI, or an empty string if none is in use. <li> The local name (without prefix). </ul> If the raw name has a prefix that has not been declared, then the return value will be empty. Note that attribute names are processed differently than element names: an unprefixed element name will received the default namespace (if any), while an unprefixed element name will not */ void QXmlNamespaceSupport::processName( const QString& qname, bool isAttribute, QString& nsuri, QString& localname ) const { uint pos; // search the ':' for( pos=0; pos<qname.length(); pos++ ) { if ( qname.at(pos) == ':' ) break; } if ( pos < qname.length() ) { // there was a ':' nsuri = uri( qname.left( pos ) ); localname = qname.mid( pos+1 ); } else { // there was no ':' if ( isAttribute ) { nsuri = ""; // attributes don't take default namespace } else { nsuri = uri( "" ); // get default namespace } localname = qname; } } /*! Returns an enumeration of all prefixes currently declared. Note: if there is a default prefix, it will not be returned in this enumeration; check for the default prefix using uri() with an argument of "". */ QStringList QXmlNamespaceSupport::prefixes() const { QStringList list; QMap<QString, QString>::ConstIterator itc, it = ns.begin(); while ( (itc=it) != ns.end() ) { ++it; if ( !itc.key().isEmpty() ) list.append( itc.key() ); } return list; } /*! Returns a list of all prefixes currently declared for a URI. The xml: prefix will be included. If you want only one prefix that's mapped to the namespace URI, and you don't care which one you get, use the prefix() function instead. Note: the empty (default) prefix is never included in this enumeration; to check for the presence of a default namespace, use uri() with an argument of "". */ QStringList QXmlNamespaceSupport::prefixes( const QString& uri ) const { QStringList list; QMap<QString, QString>::ConstIterator itc, it = ns.begin(); while ( (itc=it) != ns.end() ) { ++it; if ( itc.data() == uri && !itc.key().isEmpty() ) list.append( itc.key() ); } return list; } /*! Starts a new namespace context. Normally, you should push a new context at the beginning of each XML element: the new context will automatically inherit the declarations of its parent context, but it will also keep track of which declarations were made within this context. */ void QXmlNamespaceSupport::pushContext() { nsStack.push( ns ); } /*! Reverts to the previous namespace context. Normally, you should pop the context at the end of each XML element. After popping the context, all namespace prefix mappings that were previously in force are restored. */ void QXmlNamespaceSupport::popContext() { if( !nsStack.isEmpty() ) ns = nsStack.pop(); } /*! Resets this namespace support object for reuse. */ void QXmlNamespaceSupport::reset() { nsStack.clear(); ns.clear(); ns.insert( "xml", "http://www.w3.org/XML/1998/namespace" ); // the XML namespace } /********************************************* * * QXmlAttributes * *********************************************/ /*! \class QXmlAttributes qxml.h \brief The QXmlAttributes class provides XML attributes. \module XML If attributes are reported by QXmlContentHandler::startElement() this class is used to pass the attribute values. It provides you with different functions to access the attribute names and values. */ /*! \fn QXmlAttributes::QXmlAttributes() Constructs an empty attribute list. */ /*! \fn QXmlAttributes::~QXmlAttributes() Destructs attributes. */ /*! Look up the index of an attribute by an XML 1.0 qualified name. Returns the index of the attribute (starting with 0) or -1 if it wasn't found. See also the <a href="xml-sax.html#namespaces">namespace description</a>. */ int QXmlAttributes::index( const QString& qName ) const { return qnameList.findIndex( qName ); } /*! Looks up the index of an attribute by a namespace name. \a uri specifies the namespace URI, or the empty string if the name has no namespace URI. \a localPart specifies the attribute's local name. Returns the index of the attribute (starting with 0) or -1 if it wasn't found. See also the <a href="xml-sax.html#namespaces">namespace description</a>. */ int QXmlAttributes::index( const QString& uri, const QString& localPart ) const { uint count = uriList.count(); for ( uint i=0; i<count; i++ ) { if ( uriList[i] == uri && localnameList[i] == localPart ) return i; } return -1; } /*! Returns the number of attributes in the list. */ int QXmlAttributes::length() const { return valueList.count(); } /*! Looks up an attribute's local name by index (starting with 0). See also the <a href="xml-sax.html#namespaces">namespace description</a>. */ QString QXmlAttributes::localName( int index ) const { return localnameList[index]; } /*! Looks up an attribute's XML 1.0 qualified name by index (starting with 0). See also the <a href="xml-sax.html#namespaces">namespace description</a>. */ QString QXmlAttributes::qName( int index ) const { return qnameList[index]; } /*! Looks up an attribute's namespace URI by index (starting with 0). See also the <a href="xml-sax.html#namespaces">namespace description</a>. */ QString QXmlAttributes::uri( int index ) const { return uriList[index]; } /*! Looks up an attribute's type by index (starting with 0). At the moment only 'CDATA' is returned. */ QString QXmlAttributes::type( int ) const { return "CDATA"; } /*! Looks up an attribute's type by XML 1.0 qualified name. At the moment only 'CDATA' is returned. */ QString QXmlAttributes::type( const QString& ) const { return "CDATA"; } /*! Looks up an attribute's type by namespace name. The first parameter specifies the namespace URI, or the empty string if the name has no namespace URI. The second parameter specifies the attribute's local name. At the moment only 'CDATA' is returned. */ QString QXmlAttributes::type( const QString&, const QString& ) const { return "CDATA"; } /*! Looks up an attribute's value by index (starting with 0). */ QString QXmlAttributes::value( int index ) const { return valueList[index]; } /*! Looks up an attribute's value by XML 1.0 qualified name. See also the <a href="xml-sax.html#namespaces">namespace description</a>. */ QString QXmlAttributes::value( const QString& qName ) const { int i = index( qName ); if ( i == -1 ) return QString::null; return valueList[ i ]; } /*! Looks up an attribute's value by namespace name. \a uri specifies the namespace URI, or the empty string if the name has no namespace URI. \a localName specifies the attribute's local name. See also the <a href="xml-sax.html#namespaces">namespace description</a>. */ QString QXmlAttributes::value( const QString& uri, const QString& localName ) const { int i = index( uri, localName ); if ( i == -1 ) return QString::null; return valueList[ i ]; } /********************************************* * * QXmlInputSource * *********************************************/ /*! \class QXmlInputSource qxml.h \brief The QXmlInputSource class is the source where XML data is read from. \module XML All subclasses of QXmlReader read the input from this class. */ /*! Returns all the data this input source contains. */ const QString& QXmlInputSource::data() const { return input; } /*! Constructs a input source which contains no data. */ QXmlInputSource::QXmlInputSource( ) { input = ""; } /*! Constructs a input source and get the data from the text stream. */ QXmlInputSource::QXmlInputSource( QTextStream& stream ) { QByteArray rawData; if ( stream.device()->isDirectAccess() ) { rawData = stream.device()->readAll(); } else { int nread = 0; const int bufsize = 512; while ( !stream.device()->atEnd() ) { rawData.resize( nread + bufsize ); nread += stream.device()->readBlock( rawData.data()+nread, bufsize ); } rawData.resize( nread ); } readInput( rawData ); } /*! Constructs a input source and get the data from a file. If the file cannot be read the input source is empty. */ QXmlInputSource::QXmlInputSource( QFile& file ) { if ( !file.open(IO_ReadOnly) ) { input = ""; return; } QByteArray rawData = file.readAll(); readInput( rawData ); file.close(); } /*! Destructor. */ QXmlInputSource::~QXmlInputSource() { } /*! Sets the data of the input source to \a dat. */ void QXmlInputSource::setData( const QString& dat ) { input = dat; } /*! Read the XML file from the byte array; try to recoginize the encoding. */ // ### The input source should not do the encoding detection! void QXmlInputSource::readInput( QByteArray& rawData ) { QBuffer buf( rawData ); buf.open( IO_ReadOnly ); QTextStream *stream = new QTextStream( &buf ); QChar tmp; // assume UTF8 or UTF16 at first stream->setEncoding( QTextStream::UnicodeUTF8 ); input = ""; // read the first 5 characters for ( int i=0; i<5; i++ ) { *stream >> tmp; input += tmp; } // starts the document with an XML declaration? if ( input == "<?xml" ) { // read the whole XML declaration do { *stream >> tmp; input += tmp; } while( tmp != '>' ); // and try to find out if there is an encoding int pos = input.find( "encoding" ); if ( pos != -1 ) { QString encoding; do { pos++; if ( pos > (int)input.length() ) goto finished; } while( input[pos] != '"' && input[pos] != '\'' ); pos++; while( input[pos] != '"' && input[pos] != '\'' ) { encoding += input[pos]; pos++; if ( pos > (int)input.length() ) goto finished; } delete stream; stream = new QTextStream( &buf ); stream->setCodec( QTextCodec::codecForName( encoding ) ); buf.reset(); input = ""; } } finished: input += stream->read(); delete stream; buf.close(); } /********************************************* * * QXmlDefaultHandler * *********************************************/ /*! \class QXmlContentHandler qxml.h \brief The QXmlContentHandler class provides an interface to report logical content of XML data. \module XML If the application needs to be informed of basic parsing events, it implements this interface and sets it with QXmlReader::setContentHandler(). The reader reports basic document-related events like the start and end of elements and character data through this interface. The order of events in this interface is very important, and mirrors the order of information in the document itself. For example, all of an element's content (character data, processing instructions, and/or subelements) will appear, in order, between the startElement() event and the corresponding endElement() event. The class QXmlDefaultHandler gives a default implementation for this interface; subclassing from this class is very convenient if you want only be informed of some parsing events. See also the <a href="xml.html#introSAX2">Introduction to SAX2</a>. \sa QXmlDTDHandler QXmlDeclHandler QXmlEntityResolver QXmlErrorHandler QXmlLexicalHandler */ /*! \fn void QXmlContentHandler::setDocumentLocator( QXmlLocator* locator ) The reader calls this function before he starts parsing the document. The argument \a locator is a pointer to a QXmlLocator which allows the application to get the actual position of the parsing in the document. Do not destroy the \a locator; it is destroyed when the reader is destroyed (do not use the \a locator after the reader got destroyed). */ /*! \fn bool QXmlContentHandler::startDocument() The reader calls this function when he starts parsing the document. The reader will call this function only once before any other functions in this class or in the QXmlDTDHandler class are called (except QXmlContentHandler::setDocumentLocator()). If this function returns FALSE the reader will stop parsing and will report an error. The reader will use the function errorString() to get the error message that will be used for reporting the error. \sa endDocument() */ /*! \fn bool QXmlContentHandler::endDocument() The reader calls this function after he has finished the parsing. It is only called once. It is the last function of all handler functions that is called. It is called after the reader has read all input or has abandoned parsing because of a fatal error. If this function returns FALSE the reader will stop parsing and will report an error. The reader will use the function errorString() to get the error message that will be used for reporting the error. \sa startDocument() */ /*! \fn bool QXmlContentHandler::startPrefixMapping( const QString& prefix, const QString& uri ) The reader calls this function to signal the begin of a prefix-URI namespace mapping scope. This information is not necessary for normal namespace processing since the reader automatically replaces prefixes for element and attribute names. Note that startPrefixMapping and endPrefixMapping calls are not guaranteed to be properly nested relative to each-other: all startPrefixMapping events will occur before the corresponding startElement event, and all endPrefixMapping events will occur after the corresponding endElement event, but their order is not otherwise guaranteed. The argument \a prefix is the namespace prefix being declared and the argument \a uri is the namespace URI the prefix is mapped to. If this function returns FALSE the reader will stop parsing and will report an error. The reader will use the function errorString() to get the error message that will be used for reporting the error. See also the <a href="xml-sax.html#namespaces">namespace description</a>. \sa endPrefixMapping() */ /*! \fn bool QXmlContentHandler::endPrefixMapping( const QString& prefix ) The reader calls this function to signal the end of a prefix mapping. If this function returns FALSE the reader will stop parsing and will report an error. The reader will use the function errorString() to get the error message that will be used for reporting the error. See also the <a href="xml-sax.html#namespaces">namespace description</a>. \sa startPrefixMapping() */ /*! \fn bool QXmlContentHandler::startElement( const QString& namespaceURI, const QString& localName, const QString& qName, const QXmlAttributes& atts ) The reader calls this function when he has parsed a start element tag. There will be a corresponding endElement() call when the corresponding end element tag was read. The startElement() and endElement() calls are always nested correctly. Empty element tags (e.g. <a/>) are reported by startElement() directly followed by a call to endElement(). The attribute list provided will contain only attributes with explicit values. The attribute list will contain attributes used for namespace declaration (i.e. attributes starting with xmlns) only if the namespace-prefix property of the reader is TRUE. The argument \a uri is the namespace URI, or the empty string if the element has no namespace URI or if namespace processing is not being performed, \a localName is the local name (without prefix), or the empty string if namespace processing is not being performed, \a qName is the qualified name (with prefix), or the empty string if qualified names are not available and \a atts are the attributes attached to the element. If there are no attributes, \a atts is an empty attributes object If this function returns FALSE the reader will stop parsing and will report an error. The reader will use the function errorString() to get the error message that will be used for reporting the error. See also the <a href="xml-sax.html#namespaces">namespace description</a>. \sa endElement() */ /*! \fn bool QXmlContentHandler::endElement( const QString& namespaceURI, const QString& localName, const QString& qName ) The reader calls this function when he has parsed an end element tag. If this function returns FALSE the reader will stop parsing and will report an error. The reader will use the function errorString() to get the error message that will be used for reporting the error. See also the <a href="xml-sax.html#namespaces">namespace description</a>. \sa startElement() */ /*! \fn bool QXmlContentHandler::characters( const QString& ch ) The reader calls this function when he has parsed a chunk of character data (either normal character data or character data inside a CDATA section; if you have to distinguish between those two types you have to use QXmlLexicalHandler::startCDATA() and QXmlLexicalHandler::endCDATA() in addition). Some readers will report whitespace in element content using the ignorableWhitespace() function rather than this one (QXmlSimpleReader will do it not though). A reader is allowed to report the character data of an element in more than one chunk; e.g. a reader might want to report "a &lt; b" in three characters() events ("a ", "<" and " b"). If this function returns FALSE the reader will stop parsing and will report an error. The reader will use the function errorString() to get the error message that will be used for reporting the error. */ /*! \fn bool QXmlContentHandler::ignorableWhitespace( const QString& ch ) Some readers may use this function to report each chunk of whitespace in element content (QXmlSimpleReader does not though). If this function returns FALSE the reader will stop parsing and will report an error. The reader will use the function errorString() to get the error message that will be used for reporting the error. */ /*! \fn bool QXmlContentHandler::processingInstruction( const QString& target, const QString& data ) The reader calls this function when he has parsed a processing instruction. \a target is the target name of the processing instruction and \a data is the data of the processing instruction. If this function returns FALSE the reader will stop parsing and will report an error. The reader will use the function errorString() to get the error message that will be used for reporting the error. */ /*! \fn bool QXmlContentHandler::skippedEntity( const QString& name ) Some readers may skip entities if they have not seen the declarations (e.g. because they are in an external DTD). If they do so they will report it by calling this function. If this function returns FALSE the reader will stop parsing and will report an error. The reader will use the function errorString() to get the error message that will be used for reporting the error. */ /*! \fn QString QXmlContentHandler::errorString() The reader calls this function to get an error string if any of the handler functions returns FALSE to him. */ /*! \class QXmlErrorHandler qxml.h \brief The QXmlErrorHandler class provides an interface to report errors in XML data. \module XML If the application is interested in reporting errors to the user or any other customized error handling, you should subclass this class. You can set the error handler with QXmlReader::setErrorHandler(). See also the <a href="xml.html#introSAX2">Introduction to SAX2</a>. \sa QXmlDTDHandler QXmlDeclHandler QXmlContentHandler QXmlEntityResolver QXmlLexicalHandler */ /*! \fn bool QXmlErrorHandler::warning( const QXmlParseException& exception ) A reader might use this function to report a warning. Warnings are conditions that are not errors or fatal errors as defined by the XML 1.0 specification. If this function returns FALSE the reader will stop parsing and will report an error. The reader will use the function errorString() to get the error message that will be used for reporting the error. */ /*! \fn bool QXmlErrorHandler::error( const QXmlParseException& exception ) A reader might use this function to report a recoverable error. A recoverable error corresponds to the definiton of "error" in section 1.2 of the XML 1.0 specification. The reader must continue to provide normal parsing events after invoking this function. If this function returns FALSE the reader will stop parsing and will report an error. The reader will use the function errorString() to get the error message that will be used for reporting the error. */ /*! \fn bool QXmlErrorHandler::fatalError( const QXmlParseException& exception ) A reader must use this function to report a non-recoverable error. If this function returns TRUE the reader might try to go on parsing and reporting further errors; but no regular parsing events are reported. */ /*! \fn QString QXmlErrorHandler::errorString() The reader calls this function to get an error string if any of the handler functions returns FALSE to him. */ /*! \class QXmlDTDHandler qxml.h \brief The QXmlDTDHandler class provides an interface to report DTD content of XML data. \module XML If an application needs information about notations and unparsed entities, then the application implements this interface and registers an instance with QXmlReader::setDTDHandler(). Note that this interface includes only those DTD events that the XML recommendation requires processors to report: notation and unparsed entity declarations. See also the <a href="xml.html#introSAX2">Introduction to SAX2</a>. \sa QXmlDeclHandler QXmlContentHandler QXmlEntityResolver QXmlErrorHandler QXmlLexicalHandler */ /*! \fn bool QXmlDTDHandler::notationDecl( const QString& name, const QString& publicId, const QString& systemId ) The reader calls this function when he has parsed a notation declaration. The argument \a name is the notation name, \a publicId is the notations's public identifier and \a systemId is the notations's system identifier. If this function returns FALSE the reader will stop parsing and will report an error. The reader will use the function errorString() to get the error message that will be used for reporting the error. */ /*! \fn bool QXmlDTDHandler::unparsedEntityDecl( const QString& name, const QString& publicId, const QString& systemId, const QString& notationName ) The reader calls this function when he finds an unparsed entity declaration. The argument \a name is the unparsed entity's name, \a publicId is the entity's public identifier, \a systemId is the entity's system identifier and \a notation is the name of the associated notation. If this function returns FALSE the reader will stop parsing and will report an error. The reader will use the function errorString() to get the error message that will be used for reporting the error. */ /*! \fn QString QXmlDTDHandler::errorString() The reader calls this function to get an error string if any of the handler functions returns FALSE to him. */ /*! \class QXmlEntityResolver qxml.h \brief The QXmlEntityResolver class provides an interface to resolve extern entities contained in XML data. \module XML If an application needs to implement customized handling for external entities, it must implement this interface and register it with QXmlReader::setEntityResolver(). See also the <a href="xml.html#introSAX2">Introduction to SAX2</a>. \sa QXmlDTDHandler QXmlDeclHandler QXmlContentHandler QXmlErrorHandler QXmlLexicalHandler */ /*! \fn bool QXmlEntityResolver::resolveEntity( const QString& publicId, const QString& systemId, QXmlInputSource* ret ) The reader will call this function before he opens any external entity, except the top-level document entity. The application may request the reader to resolve the entity itself (\a ret is 0) or to use an entirely different input source (\a ret points to the input source). The reader will delete the input source \a ret when he no longer needs it. So you should allocate it on the heap with \c new. The argument \a publicId is the public identifier of the external entity, \a systemId is the system identifier of the external entity and \a ret is the return value of this function: if it is 0 the reader should resolve the entity itself, if it is non-zero it must point to an input source which the reader will use instead. If this function returns FALSE the reader will stop parsing and will report an error. The reader will use the function errorString() to get the error message that will be used for reporting the error. */ /*! \fn QString QXmlEntityResolver::errorString() The reader calls this function to get an error string if any of the handler functions returns FALSE to him. */ /*! \class QXmlLexicalHandler qxml.h \brief The QXmlLexicalHandler class provides an interface to report lexical content of XML data. \module XML The events in the lexical handler apply to the entire document, not just to the document element, and all lexical handler events appear between the content handler's startDocument and endDocument events. You can set the lexical handler with QXmlReader::setLexicalHandler(). This interface is designed after the SAX2 extension LexicalHandler. The functions startEntity() and endEntity() are not included though. See also the <a href="xml.html#introSAX2">Introduction to SAX2</a>. \sa QXmlDTDHandler QXmlDeclHandler QXmlContentHandler QXmlEntityResolver QXmlErrorHandler */ /*! \fn bool QXmlLexicalHandler::startDTD( const QString& name, const QString& publicId, const QString& systemId ) The reader calls this function to report the start of a DTD declaration, if any. All declarations reported through QXmlDTDHandler or QXmlDeclHandler appear between the startDTD() and endDTD() calls. If this function returns FALSE the reader will stop parsing and will report an error. The reader will use the function errorString() to get the error message that will be used for reporting the error. \sa endDTD() */ /*! \fn bool QXmlLexicalHandler::endDTD() The reader calls this function to report the end of a DTD declaration, if any. If this function returns FALSE the reader will stop parsing and will report an error. The reader will use the function errorString() to get the error message that will be used for reporting the error. \sa startDTD() */ /*! \fn bool QXmlLexicalHandler::startCDATA() The reader calls this function to report the start of a CDATA section. The content of the CDATA section will be reported through the regular QXmlContentHandler::characters(). This function is intended only to report the boundary. If this function returns FALSE the reader will stop parsing and will report an error. The reader will use the function errorString() to get the error message that will be used for reporting the error. \sa endCDATA() */ /*! \fn bool QXmlLexicalHandler::endCDATA() The reader calls this function to report the end of a CDATA section. If this function returns FALSE the reader will stop parsing and will report an error. The reader will use the function errorString() to get the error message that will be used for reporting the error. \sa startCDATA() */ /*! \fn bool QXmlLexicalHandler::comment( const QString& ch ) The reader calls this function to report an XML comment anywhere in the document. If this function returns FALSE the reader will stop parsing and will report an error. The reader will use the function errorString() to get the error message that will be used for reporting the error. */ /*! \fn QString QXmlLexicalHandler::errorString() The reader calls this function to get an error string if any of the handler functions returns FALSE to him. */ /*! \class QXmlDeclHandler qxml.h \brief The QXmlDeclHandler class provides an interface to report declaration content of XML data. \module XML You can set the declaration handler with QXmlReader::setDeclHandler(). This interface is designed after the SAX2 extension DeclHandler. See also the <a href="xml.html#introSAX2">Introduction to SAX2</a>. \sa QXmlDTDHandler QXmlContentHandler QXmlEntityResolver QXmlErrorHandler QXmlLexicalHandler */ /*! \fn bool QXmlDeclHandler::attributeDecl( const QString& eName, const QString& aName, const QString& type, const QString& valueDefault, const QString& value ) The reader calls this function to report an attribute type declaration. Only the effective (first) declaration for an attribute will be reported. If this function returns FALSE the reader will stop parsing and will report an error. The reader will use the function errorString() to get the error message that will be used for reporting the error. */ /*! \fn bool QXmlDeclHandler::internalEntityDecl( const QString& name, const QString& value ) The reader calls this function to report an internal entity declaration. Only the effective (first) declaration will be reported. If this function returns FALSE the reader will stop parsing and will report an error. The reader will use the function errorString() to get the error message that will be used for reporting the error. */ /*! \fn bool QXmlDeclHandler::externalEntityDecl( const QString& name, const QString& publicId, const QString& systemId ) The reader calls this function to report a parsed external entity declaration. Only the effective (first) declaration for each entity will be reported. If this function returns FALSE the reader will stop parsing and will report an error. The reader will use the function errorString() to get the error message that will be used for reporting the error. */ /*! \fn QString QXmlDeclHandler::errorString() The reader calls this function to get an error string if any of the handler functions returns FALSE to him. */ /*! \class QXmlDefaultHandler qxml.h \brief The QXmlDefaultHandler class provides a default implementation of all XML handler classes. \module XML Very often you are only interested in parts of the things that that the reader reports to you. This class simply implements a default behaviour of the handler classes (most of the time: do nothing). Normally this is the class you subclass for implementing your customized handler. See also the <a href="xml.html#introSAX2">Introduction to SAX2</a>. \sa QXmlDTDHandler QXmlDeclHandler QXmlContentHandler QXmlEntityResolver QXmlErrorHandler QXmlLexicalHandler */ /*! \fn QXmlDefaultHandler::QXmlDefaultHandler() Constructor. */ /*! \fn QXmlDefaultHandler::~QXmlDefaultHandler() Destructor. */ /*! Does nothing. */ void QXmlDefaultHandler::setDocumentLocator( QXmlLocator* ) { } /*! Does nothing. */ bool QXmlDefaultHandler::startDocument() { return TRUE; } /*! Does nothing. */ bool QXmlDefaultHandler::endDocument() { return TRUE; } /*! Does nothing. */ bool QXmlDefaultHandler::startPrefixMapping( const QString&, const QString& ) { return TRUE; } /*! Does nothing. */ bool QXmlDefaultHandler::endPrefixMapping( const QString& ) { return TRUE; } /*! Does nothing. */ bool QXmlDefaultHandler::startElement( const QString&, const QString&, const QString&, const QXmlAttributes& ) { return TRUE; } /*! Does nothing. */ bool QXmlDefaultHandler::endElement( const QString&, const QString&, const QString& ) { return TRUE; } /*! Does nothing. */ bool QXmlDefaultHandler::characters( const QString& ) { return TRUE; } /*! Does nothing. */ bool QXmlDefaultHandler::ignorableWhitespace( const QString& ) { return TRUE; } /*! Does nothing. */ bool QXmlDefaultHandler::processingInstruction( const QString&, const QString& ) { return TRUE; } /*! Does nothing. */ bool QXmlDefaultHandler::skippedEntity( const QString& ) { return TRUE; } /*! Does nothing. */ bool QXmlDefaultHandler::warning( const QXmlParseException& ) { return TRUE; } /*! Does nothing. */ bool QXmlDefaultHandler::error( const QXmlParseException& ) { return TRUE; } /*! Does nothing. */ bool QXmlDefaultHandler::fatalError( const QXmlParseException& ) { return TRUE; } /*! Does nothing. */ bool QXmlDefaultHandler::notationDecl( const QString&, const QString&, const QString& ) { return TRUE; } /*! Does nothing. */ bool QXmlDefaultHandler::unparsedEntityDecl( const QString&, const QString&, const QString&, const QString& ) { return TRUE; } /*! Always sets \a ret to 0, so that the reader will use the system identifier provided in the XML document. */ bool QXmlDefaultHandler::resolveEntity( const QString&, const QString&, QXmlInputSource* /* ret */ ) { /* ### This doesn't set anything to 0! ret = 0; */ return TRUE; } /*! Returns the default error string. */ QString QXmlDefaultHandler::errorString() { return QString( XMLERR_ERRORBYCONSUMER ); } /*! Does nothing. */ bool QXmlDefaultHandler::startDTD( const QString&, const QString&, const QString& ) { return TRUE; } /*! Does nothing. */ bool QXmlDefaultHandler::endDTD() { return TRUE; } #if 0 /*! Does nothing. */ bool QXmlDefaultHandler::startEntity( const QString& ) { return TRUE; } /*! Does nothing. */ bool QXmlDefaultHandler::endEntity( const QString& ) { return TRUE; } #endif /*! Does nothing. */ bool QXmlDefaultHandler::startCDATA() { return TRUE; } /*! Does nothing. */ bool QXmlDefaultHandler::endCDATA() { return TRUE; } /*! Does nothing. */ bool QXmlDefaultHandler::comment( const QString& ) { return TRUE; } /*! Does nothing. */ bool QXmlDefaultHandler::attributeDecl( const QString&, const QString&, const QString&, const QString&, const QString& ) { return TRUE; } /*! Does nothing. */ bool QXmlDefaultHandler::internalEntityDecl( const QString&, const QString& ) { return TRUE; } /*! Does nothing. */ bool QXmlDefaultHandler::externalEntityDecl( const QString&, const QString&, const QString& ) { return TRUE; } /********************************************* * * QXmlSimpleReaderPrivate * *********************************************/ class QXmlSimpleReaderPrivate { private: // constructor QXmlSimpleReaderPrivate() { } // used for entity declarations struct ExternParameterEntity { ExternParameterEntity( ) {} ExternParameterEntity( const QString &p, const QString &s ) : publicId(p), systemId(s) {} QString publicId; QString systemId; }; struct ExternEntity { ExternEntity( ) {} ExternEntity( const QString &p, const QString &s, const QString &n ) : publicId(p), systemId(s), notation(n) {} QString publicId; QString systemId; QString notation; }; QMap<QString,ExternParameterEntity> externParameterEntities; QMap<QString,QString> parameterEntities; QMap<QString,ExternEntity> externEntities; QMap<QString,QString> entities; // used for standalone declaration enum Standalone { Yes, No, Unknown }; QString doctype; // only used for the doctype QString xmlVersion; // only used to store the version information QString encoding; // only used to store the encoding Standalone standalone; // used to store the value of the standalone declaration QString publicId; // used by parseExternalID() to store the public ID QString systemId; // used by parseExternalID() to store the system ID QString attDeclEName; // use by parseAttlistDecl() QString attDeclAName; // use by parseAttlistDecl() // flags for some features support bool useNamespaces; bool useNamespacePrefixes; bool reportWhitespaceCharData; bool reportEntities; // used to build the attribute list QXmlAttributes attList; // helper classes QXmlLocator *locator; QXmlNamespaceSupport namespaceSupport; // error string QString error; // friend declarations friend class QXmlSimpleReader; }; /********************************************* * * QXmlSimpleReader * *********************************************/ /*! \class QXmlReader qxml.h \brief The QXmlReader class provides an interface for XML readers (i.e. parsers). \module XML This abstract class describes an interface for all XML readers in Qt. At the moment there is only one implementation of a reader included in the XML module of Qt (QXmlSimpleReader). In future releases there might be more readers with different properties available (e.g. a validating parser). The design of the XML classes follow the <a href="http://www.megginson.com/SAX/">SAX2 java interface</a>. It was adopted to fit into the Qt naming conventions; so it should be very easy for anybody who has worked with SAX2 to get started with the Qt XML classes. All readers use the class QXmlInputSource to read the input document from. Since you are normally interested in certain contents of the XML document, the reader reports those contents through special handler classes (QXmlDTDHandler, QXmlDeclHandler, QXmlContentHandler, QXmlEntityResolver, QXmlErrorHandler and QXmlLexicalHandler). You have to subclass these classes. Since the handler classes describe only interfaces you must implement all functions; there is a class (QXmlDefaultHandler) to make this easier; it implements a default behaviour (do nothing) for all functions. For getting started see also the <a href="xml-sax.html#quickStart">Quick start</a>. \sa QXmlSimpleReader */ /*! \fn bool QXmlReader::feature( const QString& name, bool *ok ) const If the reader has the feature \a name, this function returns the value of the feature. If the reader has not the feature \a name, the return value may be anything. If \a ok is not 0, then \a ok is set to TRUE if the reader has the feature \a name, otherwise \a ok is set to FALSE. \sa setFeature() hasFeature() */ /*! \fn void QXmlReader::setFeature( const QString& name, bool value ) Sets the feature \a name to \a value. If the reader has not the feature \a name, this value is ignored. \sa feature() hasFeature() */ /*! \fn bool QXmlReader::hasFeature( const QString& name ) const Returns \c TRUE if the reader has the feature \a name, otherwise FALSE. \sa feature() setFeature() */ /*! \fn void* QXmlReader::property( const QString& name, bool *ok ) const If the reader has the property \a name, this function returns the value of the property. If the reader has not the property \a name, the return value is 0. If \a ok is not 0, then \a ok is set to TRUE if the reader has the property \a name, otherwise \a ok is set to FALSE. \sa setProperty() hasProperty() */ /*! \fn void QXmlReader::setProperty( const QString& name, void* value ) Sets the property \a name to \a value. If the reader has not the property \a name, this value is ignored. \sa property() hasProperty() */ /*! \fn bool QXmlReader::hasProperty( const QString& name ) const Returns TRUE if the reader has the property \a name, otherwise FALSE. \sa property() setProperty() */ /*! \fn void QXmlReader::setEntityResolver( QXmlEntityResolver* handler ) Sets the entity resolver to \a handler. \sa entityResolver() */ /*! \fn QXmlEntityResolver* QXmlReader::entityResolver() const Returns the entity resolver or 0 if none was set. \sa setEntityResolver() */ /*! \fn void QXmlReader::setDTDHandler( QXmlDTDHandler* handler ) Sets the DTD handler to \a handler. \sa DTDHandler() */ /*! \fn QXmlDTDHandler* QXmlReader::DTDHandler() const Returns the DTD handler or 0 if none was set. \sa setDTDHandler() */ /*! \fn void QXmlReader::setContentHandler( QXmlContentHandler* handler ) Sets the content handler to \a handler. \sa contentHandler() */ /*! \fn QXmlContentHandler* QXmlReader::contentHandler() const Returns the content handler or 0 if none was set. \sa setContentHandler() */ /*! \fn void QXmlReader::setErrorHandler( QXmlErrorHandler* handler ) Sets the error handler to \a handler. \sa errorHandler() */ /*! \fn QXmlErrorHandler* QXmlReader::errorHandler() const Returns the error handler or 0 if none was set \sa setErrorHandler() */ /*! \fn void QXmlReader::setLexicalHandler( QXmlLexicalHandler* handler ) Sets the lexical handler to \a handler. \sa lexicalHandler() */ /*! \fn QXmlLexicalHandler* QXmlReader::lexicalHandler() const Returns the lexical handler or 0 if none was set. \sa setLexicalHandler() */ /*! \fn void QXmlReader::setDeclHandler( QXmlDeclHandler* handler ) Sets the declaration handler to \a handler. \sa declHandler() */ /*! \fn QXmlDeclHandler* QXmlReader::declHandler() const Returns the declaration handler or 0 if none was set. \sa setDeclHandler() */ /*! \fn bool QXmlReader::parse( const QXmlInputSource& input ) Parses the XML document \a input. Returns TRUE if the parsing was successful, otherwise FALSE. */ /*! \fn bool QXmlReader::parse( const QString& systemId ) Parses the XML document at the location \a systemId. Returns TRUE if the parsing was successful, otherwise FALSE. */ /*! \class QXmlSimpleReader qxml.h \brief The QXmlSimpleReader class provides an implementation of a simple XML reader (i.e. parser). \module XML This XML reader is sufficient for simple parsing tasks. Here is a short list of the properties of this reader: <ul> <li> well-formed parser <li> does not parse any external entities <li> can do namespace processing </ul> For getting started see also the <a href="xml-sax.html#quickStart">Quick start</a>. */ //guaranteed not to be a characater const QChar QXmlSimpleReader::QEOF = QChar((ushort)0xffff); /*! Constructs a simple XML reader. */ QXmlSimpleReader::QXmlSimpleReader() { d = new QXmlSimpleReaderPrivate(); d->locator = new QXmlLocator( this ); entityRes = 0; dtdHnd = 0; contentHnd = 0; errorHnd = 0; lexicalHnd = 0; declHnd = 0; // default feature settings d->useNamespaces = TRUE; d->useNamespacePrefixes = FALSE; d->reportWhitespaceCharData = TRUE; d->reportEntities = FALSE; } /*! Destroys a simple XML reader. */ QXmlSimpleReader::~QXmlSimpleReader() { delete d->locator; delete d; } /*! Gets the state of a feature. \sa setFeature() hasFeature() */ bool QXmlSimpleReader::feature( const QString& name, bool *ok ) const { if ( ok != 0 ) *ok = TRUE; if ( name == "http://xml.org/sax/features/namespaces" ) { return d->useNamespaces; } else if ( name == "http://xml.org/sax/features/namespace-prefixes" ) { return d->useNamespacePrefixes; } else if ( name == "http://trolltech.com/xml/features/report-whitespace-only-CharData" ) { return d->reportWhitespaceCharData; } else if ( name == "http://trolltech.com/xml/features/report-start-end-entity" ) { return d->reportEntities; } else { qWarning( "Unknown feature " + name ); if ( ok != 0 ) *ok = FALSE; } return FALSE; } /*! Sets the state of a feature. Supported features are: <ul> <li> http://xml.org/sax/features/namespaces: if this feature is TRUE, namespace processing is performed <li> http://xml.org/sax/features/namespace-prefixes: if this feature is TRUE, the the original prefixed names and attributes used for namespace declarations are reported <li> http://trolltech.com/xml/features/report-whitespace-only-CharData: if this feature is TRUE, CharData that consists only of whitespace (and no other characters) is not reported via QXmlContentHandler::characters() </ul> \sa feature() hasFeature() */ void QXmlSimpleReader::setFeature( const QString& name, bool value ) { if ( name == "http://xml.org/sax/features/namespaces" ) { d->useNamespaces = value; } else if ( name == "http://xml.org/sax/features/namespace-prefixes" ) { d->useNamespacePrefixes = value; } else if ( name == "http://trolltech.com/xml/features/report-whitespace-only-CharData" ) { d->reportWhitespaceCharData = value; } else if ( name == "http://trolltech.com/xml/features/report-start-end-entity" ) { d->reportEntities = value; } else { qWarning( "Unknown feature " + name ); } } /*! Returns TRUE if the class has a feature named \a feature, otherwise FALSE. \sa setFeature() feature() */ bool QXmlSimpleReader::hasFeature( const QString& name ) const { if ( name == "http://xml.org/sax/features/namespaces" || name == "http://xml.org/sax/features/namespace-prefixes" || name == "http://trolltech.com/xml/features/report-whitespace-only-CharData" ) { return TRUE; } else { return FALSE; } } /*! Returns 0 since this class does not support any properties. */ void* QXmlSimpleReader::property( const QString&, bool *ok ) const { if ( ok != 0 ) *ok = FALSE; return 0; } /*! Does nothing since this class does not support any properties. */ void QXmlSimpleReader::setProperty( const QString&, void* ) { } /*! Returns FALSE since this class does not support any properties. */ bool QXmlSimpleReader::hasProperty( const QString& ) const { return FALSE; } /*! \reimp */ void QXmlSimpleReader::setEntityResolver( QXmlEntityResolver* handler ) { entityRes = handler; } /*! \reimp */ QXmlEntityResolver* QXmlSimpleReader::entityResolver() const { return entityRes; } /*! \reimp */ void QXmlSimpleReader::setDTDHandler( QXmlDTDHandler* handler ) { dtdHnd = handler; } /*! \reimp */ QXmlDTDHandler* QXmlSimpleReader::DTDHandler() const { return dtdHnd; } /*! \reimp */ void QXmlSimpleReader::setContentHandler( QXmlContentHandler* handler ) { contentHnd = handler; } /*! \reimp */ QXmlContentHandler* QXmlSimpleReader::contentHandler() const { return contentHnd; } /*! \reimp */ void QXmlSimpleReader::setErrorHandler( QXmlErrorHandler* handler ) { errorHnd = handler; } /*! \reimp */ QXmlErrorHandler* QXmlSimpleReader::errorHandler() const { return errorHnd; } /*! \reimp */ void QXmlSimpleReader::setLexicalHandler( QXmlLexicalHandler* handler ) { lexicalHnd = handler; } /*! \reimp */ QXmlLexicalHandler* QXmlSimpleReader::lexicalHandler() const { return lexicalHnd; } /*! \reimp */ void QXmlSimpleReader::setDeclHandler( QXmlDeclHandler* handler ) { declHnd = handler; } /*! \reimp */ QXmlDeclHandler* QXmlSimpleReader::declHandler() const { return declHnd; } /*! \reimp */ bool QXmlSimpleReader::parse( const QXmlInputSource& input ) { init( input ); // call the handler if ( contentHnd ) { contentHnd->setDocumentLocator( d->locator ); if ( !contentHnd->startDocument() ) { d->error = contentHnd->errorString(); goto parseError; } } // parse prolog if ( !parseProlog() ) { d->error = XMLERR_ERRORPARSINGPROLOG; goto parseError; } // parse element if ( !parseElement() ) { d->error = XMLERR_ERRORPARSINGMAINELEMENT; goto parseError; } // parse Misc* while ( !atEnd() ) { if ( !parseMisc() ) { d->error = XMLERR_ERRORPARSINGMISC; goto parseError; } } // is stack empty? if ( !tags.isEmpty() ) { d->error = XMLERR_UNEXPECTEDEOF; goto parseError; } // call the handler if ( contentHnd ) { if ( !contentHnd->endDocument() ) { d->error = contentHnd->errorString(); goto parseError; } } return TRUE; // error handling parseError: reportParseError(); tags.clear(); return FALSE; } /*! Parses the prolog [22]. */ bool QXmlSimpleReader::parseProlog() { bool xmldecl_possible = TRUE; bool doctype_read = FALSE; const signed char Init = 0; const signed char EatWS = 1; // eat white spaces const signed char Lt = 2; // '<' read const signed char Em = 3; // '!' read const signed char DocType = 4; // read doctype const signed char Comment = 5; // read comment const signed char PI = 6; // read PI const signed char Done = 7; const signed char InpWs = 0; const signed char InpLt = 1; // < const signed char InpQm = 2; // ? const signed char InpEm = 3; // ! const signed char InpD = 4; // D const signed char InpDash = 5; // - const signed char InpUnknown = 6; // use some kind of state machine for parsing static const signed char table[7][7] = { /* InpWs InpLt InpQm InpEm InpD InpDash InpUnknown */ { EatWS, Lt, -1, -1, -1, -1, -1 }, // Init { -1, Lt, -1, -1, -1, -1, -1 }, // EatWS { -1, -1, PI, Em, Done, -1, Done }, // Lt { -1, -1, -1, -1, DocType, Comment, -1 }, // Em { EatWS, Lt, -1, -1, -1, -1, -1 }, // DocType { EatWS, Lt, -1, -1, -1, -1, -1 }, // Comment { EatWS, Lt, -1, -1, -1, -1, -1 } // PI }; signed char state = Init; signed char input; bool parseOk = TRUE; for (;;) { // read input if ( atEnd() ) { d->error = XMLERR_UNEXPECTEDEOF; goto parseError; } if ( is_S(c) ) { input = InpWs; } else if ( c == '<' ) { input = InpLt; } else if ( c == '?' ) { input = InpQm; } else if ( c == '!' ) { input = InpEm; } else if ( c == 'D' ) { input = InpD; } else if ( c == '-' ) { input = InpDash; } else { input = InpUnknown; } // get new state state = table[state][input]; // in some cases do special actions depending on state switch ( state ) { case EatWS: // XML declaration only on first position possible xmldecl_possible = FALSE; // eat white spaces eat_ws(); break; case Lt: // next character next(); break; case Em: // XML declaration only on first position possible xmldecl_possible = FALSE; // next character next(); break; case DocType: parseOk = parseDoctype(); break; case Comment: parseOk = parseComment(); break; case PI: parseOk = parsePI( xmldecl_possible ); break; } // no input is read after this switch ( state ) { case DocType: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGPROLOG; goto parseError; } if ( doctype_read ) { d->error = XMLERR_MORETHANONEDOCTYPE; goto parseError; } else { doctype_read = FALSE; } break; case Comment: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGPROLOG; goto parseError; } if ( lexicalHnd ) { if ( !lexicalHnd->comment( string() ) ) { d->error = lexicalHnd->errorString(); goto parseError; } } break; case PI: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGPROLOG; goto parseError; } // call the handler if ( contentHnd ) { if ( xmldecl_possible && !d->xmlVersion.isEmpty() ) { QString value( "version = '" ); value += d->xmlVersion; value += "'"; if ( !d->encoding.isEmpty() ) { value += " encoding = '"; value += d->encoding; value += "'"; } if ( d->standalone == QXmlSimpleReaderPrivate::Yes ) { value += " standalone = 'yes'"; } else if ( d->standalone == QXmlSimpleReaderPrivate::No ) { value += " standalone = 'no'"; } if ( !contentHnd->processingInstruction( "xml", value ) ) { d->error = contentHnd->errorString(); goto parseError; } } else { if ( !contentHnd->processingInstruction( name(), string() ) ) { d->error = contentHnd->errorString(); goto parseError; } } } // XML declaration only on first position possible xmldecl_possible = FALSE; break; case Done: return TRUE; case -1: d->error = XMLERR_ERRORPARSINGELEMENT; goto parseError; } } return TRUE; parseError: reportParseError(); return FALSE; } /*! Parse an element [39]. Precondition: the opening '<' is already read. */ bool QXmlSimpleReader::parseElement() { QString uri, lname, prefix; bool t; const signed char Init = 0; const signed char ReadName = 1; const signed char Ws1 = 2; const signed char STagEnd = 3; const signed char STagEnd2 = 4; const signed char ETagBegin = 5; const signed char ETagBegin2 = 6; const signed char Ws2 = 7; const signed char EmptyTag = 8; const signed char Attribute = 9; const signed char Ws3 = 10; const signed char Done = 11; const signed char InpWs = 0; // whitespace const signed char InpNameBe = 1; // is_NameBeginning() const signed char InpGt = 2; // > const signed char InpSlash = 3; // / const signed char InpUnknown = 4; // use some kind of state machine for parsing static const signed char table[11][5] = { /* InpWs InpNameBe InpGt InpSlash InpUnknown */ { -1, ReadName, -1, -1, -1 }, // Init { Ws1, Attribute, STagEnd, EmptyTag, -1 }, // ReadName { -1, Attribute, STagEnd, EmptyTag, -1 }, // Ws1 { STagEnd2, STagEnd2, STagEnd2, STagEnd2, STagEnd2 }, // STagEnd { -1, -1, -1, ETagBegin, -1 }, // STagEnd2 { -1, ETagBegin2, -1, -1, -1 }, // ETagBegin { Ws2, -1, Done, -1, -1 }, // ETagBegin2 { -1, -1, Done, -1, -1 }, // Ws2 { -1, -1, Done, -1, -1 }, // EmptyTag { Ws3, Attribute, STagEnd, EmptyTag, -1 }, // Attribute { -1, Attribute, STagEnd, EmptyTag, -1 } // Ws3 }; signed char state = Init; signed char input; bool parseOk = TRUE; for (;;) { // read input if ( atEnd() ) { d->error = XMLERR_UNEXPECTEDEOF; goto parseError; } if ( is_S(c) ) { input = InpWs; } else if ( is_NameBeginning(c) ) { input = InpNameBe; } else if ( c == '>' ) { input = InpGt; } else if ( c == '/' ) { input = InpSlash; } else { input = InpUnknown; } // get new state //qDebug( "%d -%d(%c)-> %d", state, input, c.latin1(), table[state][input] ); state = table[state][input]; // in some cases do special actions depending on state switch ( state ) { case ReadName: parseOk = parseName(); break; case Ws1: case Ws2: case Ws3: eat_ws(); break; case STagEnd: // call the handler if ( contentHnd ) { if ( d->useNamespaces ) { d->namespaceSupport.processName( tags.top(), FALSE, uri, lname ); t = contentHnd->startElement( uri, lname, tags.top(), d->attList ); } else { t = contentHnd->startElement( "", "", tags.top(), d->attList ); } if ( !t ) { d->error = contentHnd->errorString(); goto parseError; } } next(); break; case STagEnd2: parseOk = parseContent(); break; case ETagBegin: next(); break; case ETagBegin2: // get the name of the tag parseOk = parseName(); break; case EmptyTag: if ( tags.isEmpty() ) { d->error = XMLERR_TAGMISMATCH; goto parseError; } if ( !parseElementEmptyTag( t, uri, lname ) ) goto parseError; // next character next(); break; case Attribute: // get name and value of attribute parseOk = parseAttribute(); break; case Done: next(); break; } // no input is read after this switch ( state ) { case ReadName: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGNAME; goto parseError; } // store it on the stack tags.push( name() ); // empty the attributes d->attList.qnameList.clear(); d->attList.uriList.clear(); d->attList.localnameList.clear(); d->attList.valueList.clear(); // namespace support? if ( d->useNamespaces ) { d->namespaceSupport.pushContext(); } break; case STagEnd2: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGCONTENT; goto parseError; } break; case ETagBegin2: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGNAME; goto parseError; } if ( !parseElementETagBegin2() ) goto parseError; break; case Attribute: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGATTRIBUTE; goto parseError; } if ( !parseElementAttribute( prefix, uri, lname ) ) goto parseError; break; case Done: return TRUE; case -1: d->error = XMLERR_ERRORPARSINGELEMENT; goto parseError; } } return TRUE; parseError: reportParseError(); return FALSE; } /*! Helper to break down the size of the code in the case statement. Return FALSE on error, otherwise TRUE. */ // ### Remove t argument in Qt 3.0 -- I don't need it. The same should be true for uri and lname. bool QXmlSimpleReader::parseElementEmptyTag( bool &, QString &uri, QString &lname ) { // pop the stack and call the handler if ( contentHnd ) { if ( d->useNamespaces ) { // report startElement first... d->namespaceSupport.processName( tags.top(), FALSE, uri, lname ); if ( !contentHnd->startElement( uri, lname, tags.top(), d->attList ) ) { goto error; } // ... followed by endElement... if ( !contentHnd->endElement( uri, lname, tags.pop() ) ) { goto error; } // ... followed by endPrefixMapping QStringList prefixesBefore, prefixesAfter; if ( contentHnd ) { prefixesBefore = d->namespaceSupport.prefixes(); } d->namespaceSupport.popContext(); // call the handler for prefix mapping prefixesAfter = d->namespaceSupport.prefixes(); for ( QStringList::Iterator it = prefixesBefore.begin(); it != prefixesBefore.end(); ++it ) { if ( prefixesAfter.contains(*it) == 0 ) { if ( !contentHnd->endPrefixMapping( *it ) ) { goto error; } } } } else { // report startElement first... if ( !contentHnd->startElement( "", "", tags.top(), d->attList ) ) { goto error; } // ... followed by endElement if ( !contentHnd->endElement( "","",tags.pop() ) ) { goto error; } } } else { tags.pop(); d->namespaceSupport.popContext(); } return TRUE; error: d->error = contentHnd->errorString(); return FALSE; } /*! Helper to break down the size of the code in the case statement. Return FALSE on error, otherwise TRUE. */ bool QXmlSimpleReader::parseElementETagBegin2() { // pop the stack and compare it with the name if ( tags.pop() != name() ) { d->error = XMLERR_TAGMISMATCH; return FALSE; } // call the handler if ( contentHnd ) { if ( d->useNamespaces ) { QString uri, lname; d->namespaceSupport.processName( name(), FALSE, uri, lname ); if ( !contentHnd->endElement( uri, lname, name() ) ) { d->error = contentHnd->errorString(); return FALSE; } } else { if ( !contentHnd->endElement("","",name()) ) { d->error = contentHnd->errorString(); return FALSE; } } } if ( d->useNamespaces ) { QStringList prefixesBefore, prefixesAfter; if ( contentHnd ) { prefixesBefore = d->namespaceSupport.prefixes(); } d->namespaceSupport.popContext(); // call the handler for prefix mapping if ( contentHnd ) { prefixesAfter = d->namespaceSupport.prefixes(); for ( QStringList::Iterator it = prefixesBefore.begin(); it != prefixesBefore.end(); ++it ) { if ( prefixesAfter.contains(*it) == 0 ) { if ( !contentHnd->endPrefixMapping( *it ) ) { d->error = contentHnd->errorString(); return FALSE; } } } } } return TRUE; } /*! Helper to break down the size of the code in the case statement. Return FALSE on error, otherwise TRUE. */ // ### Remove arguments in Qt 3.0? I think, I don't need them. bool QXmlSimpleReader::parseElementAttribute( QString &prefix, QString &uri, QString &lname ) { // add the attribute to the list if ( d->useNamespaces ) { // is it a namespace declaration? d->namespaceSupport.splitName( name(), prefix, lname ); if ( prefix == "xmlns" ) { // namespace declaration d->namespaceSupport.setPrefix( lname, string() ); if ( d->useNamespacePrefixes ) { d->attList.qnameList.append( name() ); d->attList.uriList.append( "" ); d->attList.localnameList.append( "" ); d->attList.valueList.append( string() ); } // call the handler for prefix mapping if ( contentHnd ) { if ( !contentHnd->startPrefixMapping( lname, string() ) ) { d->error = contentHnd->errorString(); return FALSE; } } } else { // no namespace delcaration d->namespaceSupport.processName( name(), TRUE, uri, lname ); d->attList.qnameList.append( name() ); d->attList.uriList.append( uri ); d->attList.localnameList.append( lname ); d->attList.valueList.append( string() ); } } else { // no namespace support d->attList.qnameList.append( name() ); d->attList.uriList.append( "" ); d->attList.localnameList.append( "" ); d->attList.valueList.append( string() ); } return TRUE; } /*! Parse a content [43]. A content is only used between tags. If a end tag is found the < is already read and the head stand on the '/' of the end tag '</name>'. */ bool QXmlSimpleReader::parseContent() { bool charDataRead = FALSE; const signed char Init = 0; const signed char ChD = 1; // CharData const signed char ChD1 = 2; // CharData help state const signed char ChD2 = 3; // CharData help state const signed char Ref = 4; // Reference const signed char Lt = 5; // '<' read const signed char PI = 6; // PI const signed char Elem = 7; // Element const signed char Em = 8; // '!' read const signed char Com = 9; // Comment const signed char CDS = 10; // CDSect const signed char CDS1 = 11; // read a CDSect const signed char CDS2 = 12; // read a CDSect (help state) const signed char CDS3 = 13; // read a CDSect (help state) const signed char Done = 14; // finished reading content const signed char InpLt = 0; // < const signed char InpGt = 1; // > const signed char InpSlash = 2; // / const signed char InpQMark = 3; // ? const signed char InpEMark = 4; // ! const signed char InpAmp = 5; // & const signed char InpDash = 6; // - const signed char InpOpenB = 7; // [ const signed char InpCloseB = 8; // ] const signed char InpUnknown = 9; static const signed char mapCLT2FSMChar[] = { InpUnknown, // white space InpUnknown, // % InpAmp, // & InpGt, // > InpLt, // < InpSlash, // / InpQMark, // ? InpEMark, // ! InpDash, // - InpCloseB, // ] InpOpenB, // [ InpUnknown, // = InpUnknown, // " InpUnknown, // ' InpUnknown // unknown }; // use some kind of state machine for parsing static const signed char table[14][10] = { /* InpLt InpGt InpSlash InpQMark InpEMark InpAmp InpDash InpOpenB InpCloseB InpUnknown */ { Lt, ChD, ChD, ChD, ChD, Ref, ChD, ChD, ChD1, ChD }, // Init { Lt, ChD, ChD, ChD, ChD, Ref, ChD, ChD, ChD1, ChD }, // ChD { Lt, ChD, ChD, ChD, ChD, Ref, ChD, ChD, ChD2, ChD }, // ChD1 { Lt, -1, ChD, ChD, ChD, Ref, ChD, ChD, ChD2, ChD }, // ChD2 { Lt, ChD, ChD, ChD, ChD, Ref, ChD, ChD, ChD, ChD }, // Ref (same as Init) { -1, -1, Done, PI, Em, -1, -1, -1, -1, Elem }, // Lt { Lt, ChD, ChD, ChD, ChD, Ref, ChD, ChD, ChD, ChD }, // PI (same as Init) { Lt, ChD, ChD, ChD, ChD, Ref, ChD, ChD, ChD, ChD }, // Elem (same as Init) { -1, -1, -1, -1, -1, -1, Com, CDS, -1, -1 }, // Em { Lt, ChD, ChD, ChD, ChD, Ref, ChD, ChD, ChD, ChD }, // Com (same as Init) { CDS1, CDS1, CDS1, CDS1, CDS1, CDS1, CDS1, CDS1, CDS2, CDS1 }, // CDS { CDS1, CDS1, CDS1, CDS1, CDS1, CDS1, CDS1, CDS1, CDS2, CDS1 }, // CDS1 { CDS1, CDS1, CDS1, CDS1, CDS1, CDS1, CDS1, CDS1, CDS3, CDS1 }, // CDS2 { CDS1, Init, CDS1, CDS1, CDS1, CDS1, CDS1, CDS1, CDS3, CDS1 } // CDS3 }; signed char state = Init; signed char input; bool parseOk = TRUE; for (;;) { // get input (use lookup-table instead of nested ifs for performance // reasons) if ( atEnd() ) { d->error = XMLERR_UNEXPECTEDEOF; goto parseError; } if ( c.row() ) { input = InpUnknown; } else { input = mapCLT2FSMChar[ charLookupTable[ c.cell() ] ]; } // set state according to input state = table[state][input]; // do some actions according to state switch ( state ) { case Init: // next character next(); break; case ChD: // on first call: clear string if ( !charDataRead ) { charDataRead = TRUE; stringClear(); } stringAddC(); next(); break; case ChD1: // on first call: clear string if ( !charDataRead ) { charDataRead = TRUE; stringClear(); } stringAddC(); next(); break; case ChD2: stringAddC(); next(); break; case Ref: if ( !charDataRead) { // reference may be CharData; so clear string to be safe stringClear(); parseOk = parseReference( charDataRead, InContent ); } else { if ( d->reportEntities ) { // this is undocumented so far; do this right in Qt 3.0 if ( contentHnd ) { if ( d->reportWhitespaceCharData || !string().simplifyWhiteSpace().isEmpty() ) { if ( !contentHnd->characters( string() ) ) { d->error = contentHnd->errorString(); goto parseError; } } } stringClear(); } bool tmp; parseOk = parseReference( tmp, InContent ); } break; case Lt: // call the handler for CharData if ( contentHnd ) { if ( charDataRead ) { if ( d->reportWhitespaceCharData || !string().simplifyWhiteSpace().isEmpty() ) { if ( !contentHnd->characters( string() ) ) { d->error = contentHnd->errorString(); goto parseError; } } } } charDataRead = FALSE; // next character next(); break; case PI: parseOk = parsePI(); break; case Elem: parseOk = parseElement(); break; case Em: // next character next(); break; case Com: parseOk = parseComment(); break; case CDS: parseOk = parseString( "[CDATA[" ); break; case CDS1: // read one character and add it stringAddC(); next(); break; case CDS2: // skip ']' next(); break; case CDS3: // skip ']'... next(); break; } // no input is read after this switch ( state ) { case Ref: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGREFERENCE; goto parseError; } break; case PI: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGPI; goto parseError; } // call the handler if ( contentHnd ) { if ( !contentHnd->processingInstruction(name(),string()) ) { d->error = contentHnd->errorString(); goto parseError; } } break; case Elem: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGELEMENT; goto parseError; } break; case Com: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGCOMMENT; goto parseError; } if ( lexicalHnd ) { if ( !lexicalHnd->comment( string() ) ) { d->error = lexicalHnd->errorString(); goto parseError; } } break; case CDS: if( !parseOk ) { d->error = XMLERR_CDSECTHEADEREXPECTED; goto parseError; } // empty string stringClear(); break; case CDS2: if (c != ']') { stringAddC( ']' ); } break; case CDS3: // test if this skipping was legal if ( c == '>' ) { // the end of the CDSect if ( lexicalHnd ) { if ( !lexicalHnd->startCDATA() ) { d->error = lexicalHnd->errorString(); goto parseError; } } if ( contentHnd ) { if ( !contentHnd->characters( string() ) ) { d->error = contentHnd->errorString(); goto parseError; } } if ( lexicalHnd ) { if ( !lexicalHnd->endCDATA() ) { d->error = lexicalHnd->errorString(); goto parseError; } } } else if (c == ']') { // three or more ']' stringAddC( ']' ); } else { // after ']]' comes another character stringAddC( ']' ); stringAddC( ']' ); } break; case Done: // call the handler for CharData if ( contentHnd ) { if ( charDataRead ) { if ( d->reportWhitespaceCharData || !string().simplifyWhiteSpace().isEmpty() ) { if ( !contentHnd->characters( string() ) ) { d->error = contentHnd->errorString(); goto parseError; } } } } // Done return TRUE; case -1: // Error d->error = XMLERR_ERRORPARSINGCONTENT; goto parseError; } } return TRUE; parseError: reportParseError(); return FALSE; } /*! Parse Misc [27]. */ bool QXmlSimpleReader::parseMisc() { const signed char Init = 0; const signed char Lt = 1; // '<' was read const signed char Comment = 2; // read comment const signed char eatWS = 3; // eat whitespaces const signed char PI = 4; // read PI const signed char Comment2 = 5; // read comment const signed char InpWs = 0; // S const signed char InpLt = 1; // < const signed char InpQm = 2; // ? const signed char InpEm = 3; // ! const signed char InpUnknown = 4; // use some kind of state machine for parsing static const signed char table[3][5] = { /* InpWs InpLt InpQm InpEm InpUnknown */ { eatWS, Lt, -1, -1, -1 }, // Init { -1, -1, PI, Comment, -1 }, // Lt { -1, -1, -1, -1, Comment2 } // Comment }; signed char state = Init; signed char input; bool parseOk = TRUE; for (;;) { // get input if ( atEnd() ) { d->error = XMLERR_UNEXPECTEDEOF; goto parseError; } if ( is_S(c) ) { input = InpWs; } else if ( c == '<' ) { input = InpLt; } else if ( c == '?' ) { input = InpQm; } else if ( c == '!' ) { input = InpEm; } else { input = InpUnknown; } // set state according to input state = table[state][input]; // do some actions according to state switch ( state ) { case eatWS: eat_ws(); break; case Lt: next(); break; case PI: parseOk = parsePI(); break; case Comment: next(); break; case Comment2: parseOk = parseComment(); break; } // no input is read after this switch ( state ) { case eatWS: return TRUE; case PI: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGPI; goto parseError; } if ( contentHnd ) { if ( !contentHnd->processingInstruction(name(),string()) ) { d->error = contentHnd->errorString(); goto parseError; } } return TRUE; case Comment2: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGCOMMENT; goto parseError; } if ( lexicalHnd ) { if ( !lexicalHnd->comment( string() ) ) { d->error = lexicalHnd->errorString(); goto parseError; } } return TRUE; case -1: // Error d->error = XMLERR_UNEXPECTEDCHARACTER; goto parseError; } } return TRUE; parseError: reportParseError(); return FALSE; } /*! Parse a processing instruction [16]. If xmldec is TRUE, it tries to parse a PI or a XML declaration [23]. Precondition: the beginning '<' of the PI is already read and the head stand on the '?' of '<?'. If this funktion was successful, the head-position is on the first character after the PI. */ bool QXmlSimpleReader::parsePI( bool xmldecl ) { const signed char Init = 0; const signed char QmI = 1; // ? was read const signed char Name = 2; // read Name const signed char XMLDecl = 3; // read XMLDecl const signed char Ws1 = 4; // eat ws after "xml" of XMLDecl const signed char PI = 5; // read PI const signed char Ws2 = 6; // eat ws after Name of PI const signed char Version = 7; // read versionInfo const signed char Ws3 = 8; // eat ws after versionInfo const signed char EorSD = 9; // read EDecl or SDDecl const signed char Ws4 = 10; // eat ws after EDecl or SDDecl const signed char SD = 11; // read SDDecl const signed char Ws5 = 12; // eat ws after SDDecl const signed char ADone = 13; // almost done const signed char Char = 14; // Char was read const signed char Qm = 15; // Qm was read const signed char Done = 16; // finished reading content const signed char InpWs = 0; // whitespace const signed char InpNameBe = 1; // is_nameBeginning() const signed char InpGt = 2; // > const signed char InpQm = 3; // ? const signed char InpUnknown = 4; // use some kind of state machine for parsing static const signed char table[16][5] = { /* InpWs, InpNameBe InpGt InpQm InpUnknown */ { -1, -1, -1, QmI, -1 }, // Init { -1, Name, -1, -1, -1 }, // QmI { -1, -1, -1, -1, -1 }, // Name (this state is left not through input) { Ws1, -1, -1, -1, -1 }, // XMLDecl { -1, Version, -1, -1, -1 }, // Ws1 { Ws2, -1, -1, Qm, -1 }, // PI { Char, Char, Char, Qm, Char }, // Ws2 { Ws3, -1, -1, ADone, -1 }, // Version { -1, EorSD, -1, ADone, -1 }, // Ws3 { Ws4, -1, -1, ADone, -1 }, // EorSD { -1, SD, -1, ADone, -1 }, // Ws4 { Ws5, -1, -1, ADone, -1 }, // SD { -1, -1, -1, ADone, -1 }, // Ws5 { -1, -1, Done, -1, -1 }, // ADone { Char, Char, Char, Qm, Char }, // Char { Char, Char, Done, Qm, Char }, // Qm }; signed char state = Init; signed char input; bool parseOk = TRUE; for (;;) { // get input if ( atEnd() ) { d->error = XMLERR_UNEXPECTEDEOF; goto parseError; } if ( is_S(c) ) { input = InpWs; } else if ( is_NameBeginning(c) ) { input = InpNameBe; } else if ( c == '>' ) { input = InpGt; } else if ( c == '?' ) { input = InpQm; } else { input = InpUnknown; } // set state according to input state = table[state][input]; // do some actions according to state switch ( state ) { case QmI: next(); break; case Name: parseOk = parseName(); break; case Ws1: case Ws2: case Ws3: case Ws4: case Ws5: eat_ws(); break; case Version: parseOk = parseAttribute(); break; case EorSD: parseOk = parseAttribute(); break; case SD: // get the SDDecl (syntax like an attribute) if ( d->standalone != QXmlSimpleReaderPrivate::Unknown ) { // already parsed the standalone declaration d->error = XMLERR_UNEXPECTEDCHARACTER; goto parseError; } parseOk = parseAttribute(); break; case ADone: next(); break; case Char: stringAddC(); next(); break; case Qm: // skip the '?' next(); break; case Done: next(); break; } // no input is read after this switch ( state ) { case Name: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGNAME; goto parseError; } // test what name was read and determine the next state // (not very beautiful, I admit) if ( name().lower() == "xml" ) { if ( xmldecl && name()=="xml" ) { state = XMLDecl; } else { d->error = XMLERR_INVALIDNAMEFORPI; goto parseError; } } else { state = PI; stringClear(); } break; case Version: // get version (syntax like an attribute) if ( !parseOk ) { d->error = XMLERR_VERSIONEXPECTED; goto parseError; } if ( name() != "version" ) { d->error = XMLERR_VERSIONEXPECTED; goto parseError; } d->xmlVersion = string(); break; case EorSD: // get the EDecl or SDDecl (syntax like an attribute) if ( !parseOk ) { d->error = XMLERR_EDECLORSDDECLEXPECTED; goto parseError; } if ( name() == "standalone" ) { if ( string()=="yes" ) { d->standalone = QXmlSimpleReaderPrivate::Yes; } else if ( string()=="no" ) { d->standalone = QXmlSimpleReaderPrivate::No; } else { d->error = XMLERR_WRONGVALUEFORSDECL; goto parseError; } } else if ( name() == "encoding" ) { d->encoding = string(); } else { d->error = XMLERR_EDECLORSDDECLEXPECTED; goto parseError; } break; case SD: if ( !parseOk ) { d->error = XMLERR_SDDECLEXPECTED; goto parseError; } if ( name() != "standalone" ) { d->error = XMLERR_SDDECLEXPECTED; goto parseError; } if ( string()=="yes" ) { d->standalone = QXmlSimpleReaderPrivate::Yes; } else if ( string()=="no" ) { d->standalone = QXmlSimpleReaderPrivate::No; } else { d->error = XMLERR_WRONGVALUEFORSDECL; goto parseError; } break; case Qm: // test if the skipping was legal if ( c != '>' ) { stringAddC( '?' ); } break; case Done: return TRUE; case -1: // Error d->error = XMLERR_UNEXPECTEDCHARACTER; goto parseError; } } return TRUE; parseError: reportParseError(); return FALSE; } /*! Parse a document type definition (doctypedecl [28]). Precondition: the beginning '<!' of the doctype is already read the head stands on the 'D' of '<!DOCTYPE'. If this funktion was successful, the head-position is on the first character after the document type definition. */ bool QXmlSimpleReader::parseDoctype() { // some init-stuff d->systemId = QString::null; d->publicId = QString::null; const signed char Init = 0; const signed char Doctype = 1; // read the doctype const signed char Ws1 = 2; // eat_ws const signed char Doctype2 = 3; // read the doctype, part 2 const signed char Ws2 = 4; // eat_ws const signed char Sys = 5; // read SYSTEM const signed char Ws3 = 6; // eat_ws const signed char MP = 7; // markupdecl or PEReference const signed char PER = 8; // PERReference const signed char Mup = 9; // markupdecl const signed char Ws4 = 10; // eat_ws const signed char MPE = 11; // end of markupdecl or PEReference const signed char Done = 12; const signed char InpWs = 0; const signed char InpD = 1; // 'D' const signed char InpS = 2; // 'S' or 'P' const signed char InpOB = 3; // [ const signed char InpCB = 4; // ] const signed char InpPer = 5; // % const signed char InpGt = 6; // > const signed char InpUnknown = 7; // use some kind of state machine for parsing static const signed char table[12][8] = { /* InpWs, InpD InpS InpOB InpCB InpPer InpGt InpUnknown */ { -1, Doctype, -1, -1, -1, -1, -1, -1 }, // Init { Ws1, Doctype2, Doctype2, -1, -1, -1, -1, Doctype2 }, // Doctype { -1, Doctype2, Doctype2, -1, -1, -1, -1, Doctype2 }, // Ws1 { Ws2, -1, Sys, MP, -1, -1, Done, -1 }, // Doctype2 { -1, -1, Sys, MP, -1, -1, Done, -1 }, // Ws2 { Ws3, -1, -1, MP, -1, -1, Done, -1 }, // Sys { -1, -1, -1, MP, -1, -1, Done, -1 }, // Ws3 { -1, -1, -1, -1, MPE, PER, -1, Mup }, // MP { Ws4, -1, -1, -1, MPE, PER, -1, Mup }, // PER { Ws4, -1, -1, -1, MPE, PER, -1, Mup }, // Mup { -1, -1, -1, -1, MPE, PER, -1, Mup }, // Ws4 { -1, -1, -1, -1, -1, -1, Done, -1 } // MPE }; signed char state = Init; signed char input; bool parseOk = TRUE; for (;;) { // get input if ( atEnd() ) { d->error = XMLERR_UNEXPECTEDEOF; goto parseError; } if ( is_S(c) ) { input = InpWs; } else if ( c == 'D' ) { input = InpD; } else if ( c == 'S' ) { input = InpS; } else if ( c == 'P' ) { input = InpS; } else if ( c == '[' ) { input = InpOB; } else if ( c == ']' ) { input = InpCB; } else if ( c == '%' ) { input = InpPer; } else if ( c == '>' ) { input = InpGt; } else { input = InpUnknown; } // set state according to input state = table[state][input]; // do some actions according to state switch ( state ) { case Doctype: parseOk = parseString( "DOCTYPE" ); break; case Ws1: case Ws2: case Ws3: case Ws4: eat_ws(); break; case Doctype2: parseName(); break; case Sys: parseOk = parseExternalID(); break; case MP: next_eat_ws(); break; case PER: parseOk = parsePEReference( InDTD ); break; case Mup: parseOk = parseMarkupdecl(); break; case MPE: next_eat_ws(); break; case Done: if ( lexicalHnd ) { if ( !lexicalHnd->endDTD() ) { d->error = lexicalHnd->errorString(); goto parseError; } } next(); break; } // no input is read after this switch ( state ) { case Doctype: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGDOCTYPE; goto parseError; } if ( !is_S(c) ) { d->error = XMLERR_ERRORPARSINGDOCTYPE; goto parseError; } break; case Doctype2: d->doctype = name(); if ( lexicalHnd ) { if ( !lexicalHnd->startDTD( d->doctype, d->publicId, d->systemId ) ) { d->error = lexicalHnd->errorString(); goto parseError; } } break; case Sys: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGDOCTYPE; goto parseError; } break; case PER: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGDOCTYPE; goto parseError; } break; case Mup: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGDOCTYPE; goto parseError; } break; case Done: return TRUE; case -1: // Error d->error = XMLERR_ERRORPARSINGDOCTYPE; goto parseError; } } return TRUE; parseError: reportParseError(); return FALSE; } /*! Parse a ExternalID [75]. If allowPublicID is TRUE parse ExternalID [75] or PublicID [83]. */ bool QXmlSimpleReader::parseExternalID( bool allowPublicID ) { // some init-stuff d->systemId = QString::null; d->publicId = QString::null; const signed char Init = 0; const signed char Sys = 1; // parse 'SYSTEM' const signed char SysWS = 2; // parse the whitespace after 'SYSTEM' const signed char SysSQ = 3; // parse SystemLiteral with ' const signed char SysSQ2 = 4; // parse SystemLiteral with ' const signed char SysDQ = 5; // parse SystemLiteral with " const signed char SysDQ2 = 6; // parse SystemLiteral with " const signed char Pub = 7; // parse 'PUBLIC' const signed char PubWS = 8; // parse the whitespace after 'PUBLIC' const signed char PubSQ = 9; // parse PubidLiteral with ' const signed char PubSQ2 = 10; // parse PubidLiteral with ' const signed char PubDQ = 11; // parse PubidLiteral with " const signed char PubDQ2 = 12; // parse PubidLiteral with " const signed char PubE = 13; // finished parsing the PubidLiteral const signed char PubWS2 = 14; // parse the whitespace after the PubidLiteral const signed char PDone = 15; // done if allowPublicID is TRUE const signed char Done = 16; const signed char InpSQ = 0; // ' const signed char InpDQ = 1; // " const signed char InpS = 2; // S const signed char InpP = 3; // P const signed char InpWs = 4; // white space const signed char InpUnknown = 5; // use some kind of state machine for parsing static const signed char table[15][6] = { /* InpSQ InpDQ InpS InpP InpWs InpUnknown */ { -1, -1, Sys, Pub, -1, -1 }, // Init { -1, -1, -1, -1, SysWS, -1 }, // Sys { SysSQ, SysDQ, -1, -1, -1, -1 }, // SysWS { Done, SysSQ2, SysSQ2, SysSQ2, SysSQ2, SysSQ2 }, // SysSQ { Done, SysSQ2, SysSQ2, SysSQ2, SysSQ2, SysSQ2 }, // SysSQ2 { SysDQ2, Done, SysDQ2, SysDQ2, SysDQ2, SysDQ2 }, // SysDQ { SysDQ2, Done, SysDQ2, SysDQ2, SysDQ2, SysDQ2 }, // SysDQ2 { -1, -1, -1, -1, PubWS, -1 }, // Pub { PubSQ, PubDQ, -1, -1, -1, -1 }, // PubWS { PubE, -1, PubSQ2, PubSQ2, PubSQ2, PubSQ2 }, // PubSQ { PubE, -1, PubSQ2, PubSQ2, PubSQ2, PubSQ2 }, // PubSQ2 { -1, PubE, PubDQ2, PubDQ2, PubDQ2, PubDQ2 }, // PubDQ { -1, PubE, PubDQ2, PubDQ2, PubDQ2, PubDQ2 }, // PubDQ2 { PDone, PDone, PDone, PDone, PubWS2, PDone }, // PubE { SysSQ, SysDQ, PDone, PDone, PDone, PDone } // PubWS2 }; signed char state = Init; signed char input; bool parseOk = TRUE; for (;;) { // get input if ( atEnd() ) { d->error = XMLERR_UNEXPECTEDEOF; goto parseError; } if ( is_S(c) ) { input = InpWs; } else if ( c == '\'' ) { input = InpSQ; } else if ( c == '"' ) { input = InpDQ; } else if ( c == 'S' ) { input = InpS; } else if ( c == 'P' ) { input = InpP; } else { input = InpUnknown; } // set state according to input state = table[state][input]; // do some actions according to state switch ( state ) { case Sys: parseOk = parseString( "SYSTEM" ); break; case SysWS: eat_ws(); break; case SysSQ: case SysDQ: stringClear(); next(); break; case SysSQ2: case SysDQ2: stringAddC(); next(); break; case Pub: parseOk = parseString( "PUBLIC" ); break; case PubWS: eat_ws(); break; case PubSQ: case PubDQ: stringClear(); next(); break; case PubSQ2: case PubDQ2: stringAddC(); next(); break; case PubE: next(); break; case PubWS2: d->publicId = string(); eat_ws(); break; case Done: d->systemId = string(); next(); break; } // no input is read after this switch ( state ) { case Sys: if( !parseOk ) { d->error = XMLERR_UNEXPECTEDCHARACTER; goto parseError; } break; case Pub: if( !parseOk ) { d->error = XMLERR_UNEXPECTEDCHARACTER; goto parseError; } break; case PDone: if ( allowPublicID ) { d->publicId = string(); return TRUE; } else { d->error = XMLERR_UNEXPECTEDCHARACTER; goto parseError; } break; case Done: return TRUE; case -1: // Error d->error = XMLERR_UNEXPECTEDCHARACTER; goto parseError; } } return TRUE; parseError: reportParseError(); return FALSE; } /*! Parse a markupdecl [29]. */ bool QXmlSimpleReader::parseMarkupdecl() { const signed char Init = 0; const signed char Lt = 1; // < was read const signed char Em = 2; // ! was read const signed char CE = 3; // E was read const signed char Qm = 4; // ? was read const signed char Dash = 5; // - was read const signed char CA = 6; // A was read const signed char CEL = 7; // EL was read const signed char CEN = 8; // EN was read const signed char CN = 9; // N was read const signed char Done = 10; const signed char InpLt = 0; // < const signed char InpQm = 1; // ? const signed char InpEm = 2; // ! const signed char InpDash = 3; // - const signed char InpA = 4; // A const signed char InpE = 5; // E const signed char InpL = 6; // L const signed char InpN = 7; // N const signed char InpUnknown = 8; // use some kind of state machine for parsing static const signed char table[4][9] = { /* InpLt InpQm InpEm InpDash InpA InpE InpL InpN InpUnknown */ { Lt, -1, -1, -1, -1, -1, -1, -1, -1 }, // Init { -1, Qm, Em, -1, -1, -1, -1, -1, -1 }, // Lt { -1, -1, -1, Dash, CA, CE, -1, CN, -1 }, // Em { -1, -1, -1, -1, -1, -1, CEL, CEN, -1 } // CE }; signed char state = Init; signed char input; bool parseOk = TRUE; for (;;) { // get input if ( atEnd() ) { d->error = XMLERR_UNEXPECTEDEOF; goto parseError; } if ( c == '<' ) { input = InpLt; } else if ( c == '?' ) { input = InpQm; } else if ( c == '!' ) { input = InpEm; } else if ( c == '-' ) { input = InpDash; } else if ( c == 'A' ) { input = InpA; } else if ( c == 'E' ) { input = InpE; } else if ( c == 'L' ) { input = InpL; } else if ( c == 'N' ) { input = InpN; } else { input = InpUnknown; } // set state according to input state = table[state][input]; // do some actions according to state switch ( state ) { case Lt: next(); break; case Em: next(); break; case CE: next(); break; case Qm: parseOk = parsePI(); break; case Dash: parseOk = parseComment(); break; case CA: parseOk = parseAttlistDecl(); break; case CEL: parseOk = parseElementDecl(); break; case CEN: parseOk = parseEntityDecl(); break; case CN: parseOk = parseNotationDecl(); break; } // no input is read after this switch ( state ) { case Qm: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGPI; goto parseError; } if ( contentHnd ) { if ( !contentHnd->processingInstruction(name(),string()) ) { d->error = contentHnd->errorString(); goto parseError; } } return TRUE; case Dash: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGCOMMENT; goto parseError; } if ( lexicalHnd ) { if ( !lexicalHnd->comment( string() ) ) { d->error = lexicalHnd->errorString(); goto parseError; } } return TRUE; case CA: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGATTLISTDECL; goto parseError; } return TRUE; case CEL: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGELEMENTDECL; goto parseError; } return TRUE; case CEN: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGENTITYDECL; goto parseError; } return TRUE; case CN: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGNOTATIONDECL; goto parseError; } return TRUE; case Done: return TRUE; case -1: // Error d->error = XMLERR_LETTEREXPECTED; goto parseError; } } return TRUE; parseError: reportParseError(); return FALSE; } /*! Parse a PEReference [69] */ bool QXmlSimpleReader::parsePEReference( EntityRecognitionContext context ) { const signed char Init = 0; const signed char Next = 1; const signed char Name = 2; const signed char Done = 3; const signed char InpSemi = 0; // ; const signed char InpPer = 1; // % const signed char InpUnknown = 2; // use some kind of state machine for parsing static const signed char table[3][3] = { /* InpSemi InpPer InpUnknown */ { -1, Next, -1 }, // Init { -1, -1, Name }, // Next { Done, -1, -1 } // Name }; signed char state = Init; signed char input; bool parseOk = TRUE; for (;;) { // get input if ( atEnd() ) { d->error = XMLERR_UNEXPECTEDEOF; goto parseError; } if ( c == ';' ) { input = InpSemi; } else if ( c == '%' ) { input = InpPer; } else { input = InpUnknown; } // set state according to input state = table[state][input]; // do some actions according to state switch ( state ) { case Next: next(); break; case Name: parseOk = parseName( TRUE ); break; case Done: next(); break; } // no input is read after this switch ( state ) { case Name: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGNAME; goto parseError; } if ( d->parameterEntities.find( ref() ) == d->parameterEntities.end() ) { // ### skip it??? if ( contentHnd ) { if ( !contentHnd->skippedEntity( QString("%") + ref() ) ) { d->error = contentHnd->errorString(); goto parseError; } } } else { if ( context == InEntityValue ) { // Included in literal xmlRef = d->parameterEntities.find( ref() ) .data().replace( QRegExp("\""), """ ).replace( QRegExp("'"), "'" ) + xmlRef; } else if ( context == InDTD ) { // Included as PE xmlRef = QString(" ") + d->parameterEntities.find( ref() ).data() + QString(" ") + xmlRef; } } break; case Done: return TRUE; case -1: // Error d->error = XMLERR_LETTEREXPECTED; goto parseError; } } return TRUE; parseError: reportParseError(); return FALSE; } /*! Parse a AttlistDecl [52]. Precondition: the beginning '<!' is already read and the head stands on the 'A' of '<!ATTLIST' */ bool QXmlSimpleReader::parseAttlistDecl() { const signed char Init = 0; const signed char Attlist = 1; // parse the string "ATTLIST" const signed char Ws = 2; // whitespace read const signed char Name = 3; // parse name const signed char Ws1 = 4; // whitespace read const signed char Attdef = 5; // parse the AttDef const signed char Ws2 = 6; // whitespace read const signed char Atttype = 7; // parse the AttType const signed char Ws3 = 8; // whitespace read const signed char DDecH = 9; // DefaultDecl with # const signed char DefReq = 10; // parse the string "REQUIRED" const signed char DefImp = 11; // parse the string "IMPLIED" const signed char DefFix = 12; // parse the string "FIXED" const signed char Attval = 13; // parse the AttValue const signed char Ws4 = 14; // whitespace read const signed char Done = 15; const signed char InpWs = 0; // white space const signed char InpGt = 1; // > const signed char InpHash = 2; // # const signed char InpA = 3; // A const signed char InpI = 4; // I const signed char InpF = 5; // F const signed char InpR = 6; // R const signed char InpUnknown = 7; // use some kind of state machine for parsing static const signed char table[15][8] = { /* InpWs InpGt InpHash InpA InpI InpF InpR InpUnknown */ { -1, -1, -1, Attlist, -1, -1, -1, -1 }, // Init { Ws, -1, -1, -1, -1, -1, -1, -1 }, // Attlist { -1, -1, -1, Name, Name, Name, Name, Name }, // Ws { Ws1, Done, Attdef, Attdef, Attdef, Attdef, Attdef, Attdef }, // Name { -1, Done, Attdef, Attdef, Attdef, Attdef, Attdef, Attdef }, // Ws1 { Ws2, -1, -1, -1, -1, -1, -1, -1 }, // Attdef { -1, Atttype, Atttype, Atttype, Atttype, Atttype, Atttype, Atttype }, // Ws2 { Ws3, -1, -1, -1, -1, -1, -1, -1 }, // Attype { -1, Attval, DDecH, Attval, Attval, Attval, Attval, Attval }, // Ws3 { -1, -1, -1, -1, DefImp, DefFix, DefReq, -1 }, // DDecH { Ws4, Ws4, -1, -1, -1, -1, -1, -1 }, // DefReq { Ws4, Ws4, -1, -1, -1, -1, -1, -1 }, // DefImp { Ws3, -1, -1, -1, -1, -1, -1, -1 }, // DefFix { Ws4, Ws4, -1, -1, -1, -1, -1, -1 }, // Attval { -1, Done, Attdef, Attdef, Attdef, Attdef, Attdef, Attdef } // Ws4 }; signed char state = Init; signed char input; bool parseOk = TRUE; for (;;) { // get input if ( atEnd() ) { d->error = XMLERR_UNEXPECTEDEOF; goto parseError; } if ( is_S(c) ) { input = InpWs; } else if ( c == '>' ) { input = InpGt; } else if ( c == '#' ) { input = InpHash; } else if ( c == 'A' ) { input = InpA; } else if ( c == 'I' ) { input = InpI; } else if ( c == 'F' ) { input = InpF; } else if ( c == 'R' ) { input = InpR; } else { input = InpUnknown; } // set state according to input state = table[state][input]; // do some actions according to state switch ( state ) { case Attlist: parseOk = parseString( "ATTLIST" ); break; case Ws: case Ws1: case Ws2: case Ws3: eat_ws(); break; case Name: parseOk = parseName(); break; case Attdef: parseOk = parseName(); break; case Atttype: parseOk = parseAttType(); break; case DDecH: next(); break; case DefReq: parseOk = parseString( "REQUIRED" ); break; case DefImp: parseOk = parseString( "IMPLIED" ); break; case DefFix: parseOk = parseString( "FIXED" ); break; case Attval: parseOk = parseAttValue(); break; case Ws4: if ( declHnd ) { // TODO: not all values are computed yet... if ( !declHnd->attributeDecl( d->attDeclEName, d->attDeclAName, "", "", "" ) ) { d->error = declHnd->errorString(); goto parseError; } } eat_ws(); break; case Done: next(); break; } // no input is read after this switch ( state ) { case Attlist: if( !parseOk ) { d->error = XMLERR_UNEXPECTEDCHARACTER; goto parseError; } break; case Name: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGNAME; goto parseError; } d->attDeclEName = name(); break; case Attdef: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGNAME; goto parseError; } d->attDeclAName = name(); break; case Atttype: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGATTTYPE; goto parseError; } break; case DefReq: if( !parseOk ) { d->error = XMLERR_UNEXPECTEDCHARACTER; goto parseError; } break; case DefImp: if( !parseOk ) { d->error = XMLERR_UNEXPECTEDCHARACTER; goto parseError; } break; case DefFix: if( !parseOk ) { d->error = XMLERR_UNEXPECTEDCHARACTER; goto parseError; } break; case Attval: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGATTVALUE; goto parseError; } break; case Done: return TRUE; case -1: // Error d->error = XMLERR_LETTEREXPECTED; goto parseError; } } return TRUE; parseError: reportParseError(); return FALSE; } /*! Parse a AttType [54] */ bool QXmlSimpleReader::parseAttType() { const signed char Init = 0; const signed char ST = 1; // StringType const signed char TTI = 2; // TokenizedType starting with 'I' const signed char TTI2 = 3; // TokenizedType helpstate const signed char TTI3 = 4; // TokenizedType helpstate const signed char TTE = 5; // TokenizedType starting with 'E' const signed char TTEY = 6; // TokenizedType starting with 'ENTITY' const signed char TTEI = 7; // TokenizedType starting with 'ENTITI' const signed char N = 8; // N read (TokenizedType or Notation) const signed char TTNM = 9; // TokenizedType starting with 'NM' const signed char TTNM2 = 10; // TokenizedType helpstate const signed char NO = 11; // Notation const signed char NO2 = 12; // Notation helpstate const signed char NO3 = 13; // Notation helpstate const signed char NOName = 14; // Notation, read name const signed char NO4 = 15; // Notation helpstate const signed char EN = 16; // Enumeration const signed char ENNmt = 17; // Enumeration, read Nmtoken const signed char EN2 = 18; // Enumeration helpstate const signed char ADone = 19; // almost done (make next and accept) const signed char Done = 20; const signed char InpWs = 0; // whitespace const signed char InpOp = 1; // ( const signed char InpCp = 2; // ) const signed char InpPipe = 3; // | const signed char InpC = 4; // C const signed char InpE = 5; // E const signed char InpI = 6; // I const signed char InpM = 7; // M const signed char InpN = 8; // N const signed char InpO = 9; // O const signed char InpR = 10; // R const signed char InpS = 11; // S const signed char InpY = 12; // Y const signed char InpUnknown = 13; // use some kind of state machine for parsing static const signed char table[19][14] = { /* InpWs InpOp InpCp InpPipe InpC InpE InpI InpM InpN InpO InpR InpS InpY InpUnknown */ { -1, EN, -1, -1, ST, TTE, TTI, -1, N, -1, -1, -1, -1, -1 }, // Init { Done, Done, Done, Done, Done, Done, Done, Done, Done, Done, Done, Done, Done, Done }, // ST { Done, Done, Done, Done, Done, Done, Done, Done, Done, Done, TTI2, Done, Done, Done }, // TTI { Done, Done, Done, Done, Done, Done, Done, Done, Done, Done, Done, TTI3, Done, Done }, // TTI2 { Done, Done, Done, Done, Done, Done, Done, Done, Done, Done, Done, Done, Done, Done }, // TTI3 { -1, -1, -1, -1, -1, -1, TTEI, -1, -1, -1, -1, -1, TTEY, -1 }, // TTE { Done, Done, Done, Done, Done, Done, Done, Done, Done, Done, Done, Done, Done, Done }, // TTEY { Done, Done, Done, Done, Done, Done, Done, Done, Done, Done, Done, Done, Done, Done }, // TTEI { -1, -1, -1, -1, -1, -1, -1, TTNM, -1, NO, -1, -1, -1, -1 }, // N { Done, Done, Done, Done, Done, Done, Done, Done, Done, Done, Done, TTNM2, Done, Done }, // TTNM { Done, Done, Done, Done, Done, Done, Done, Done, Done, Done, Done, Done, Done, Done }, // TTNM2 { NO2, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1 }, // NO { -1, NO3, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1 }, // NO2 { NOName, NOName, NOName, NOName, NOName, NOName, NOName, NOName, NOName, NOName, NOName, NOName, NOName, NOName }, // NO3 { NO4, -1, ADone, NO3, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1 }, // NOName { -1, -1, ADone, NO3, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1 }, // NO4 { -1, -1, ENNmt, -1, ENNmt, ENNmt, ENNmt, ENNmt, ENNmt, ENNmt, ENNmt, ENNmt, ENNmt, ENNmt }, // EN { EN2, -1, ADone, EN, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1 }, // ENNmt { -1, -1, ADone, EN, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1 } // EN2 }; signed char state = Init; signed char input; bool parseOk = TRUE; for (;;) { // get input if ( atEnd() ) { d->error = XMLERR_UNEXPECTEDEOF; goto parseError; } if ( is_S(c) ) { input = InpWs; } else if ( c == '(' ) { input = InpOp; } else if ( c == ')' ) { input = InpCp; } else if ( c == '|' ) { input = InpPipe; } else if ( c == 'C' ) { input = InpC; } else if ( c == 'E' ) { input = InpE; } else if ( c == 'I' ) { input = InpI; } else if ( c == 'M' ) { input = InpM; } else if ( c == 'N' ) { input = InpN; } else if ( c == 'O' ) { input = InpO; } else if ( c == 'R' ) { input = InpR; } else if ( c == 'S' ) { input = InpS; } else if ( c == 'Y' ) { input = InpY; } else { input = InpUnknown; } // set state according to input state = table[state][input]; // do some actions according to state switch ( state ) { case ST: parseOk = parseString( "CDATA" ); break; case TTI: parseOk = parseString( "ID" ); break; case TTI2: parseOk = parseString( "REF" ); break; case TTI3: next(); // S break; case TTE: parseOk = parseString( "ENTIT" ); break; case TTEY: next(); // Y break; case TTEI: parseOk = parseString( "IES" ); break; case N: next(); // N break; case TTNM: parseOk = parseString( "MTOKEN" ); break; case TTNM2: next(); // S break; case NO: parseOk = parseString( "OTATION" ); break; case NO2: eat_ws(); break; case NO3: next_eat_ws(); break; case NOName: parseOk = parseName(); break; case NO4: eat_ws(); break; case EN: next_eat_ws(); break; case ENNmt: parseOk = parseNmtoken(); break; case EN2: eat_ws(); break; case ADone: next(); break; } // no input is read after this switch ( state ) { case ST: if( !parseOk ) { d->error = XMLERR_UNEXPECTEDCHARACTER; goto parseError; } break; case TTI: if( !parseOk ) { d->error = XMLERR_UNEXPECTEDCHARACTER; goto parseError; } break; case TTI2: if( !parseOk ) { d->error = XMLERR_UNEXPECTEDCHARACTER; goto parseError; } break; case TTE: if( !parseOk ) { d->error = XMLERR_UNEXPECTEDCHARACTER; goto parseError; } break; case TTEI: if( !parseOk ) { d->error = XMLERR_UNEXPECTEDCHARACTER; goto parseError; } break; case TTNM: if( !parseOk ) { d->error = XMLERR_UNEXPECTEDCHARACTER; goto parseError; } break; case NO: if( !parseOk ) { d->error = XMLERR_UNEXPECTEDCHARACTER; goto parseError; } break; case NOName: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGNAME; goto parseError; } break; case ENNmt: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGNMTOKEN; goto parseError; } break; case ADone: return TRUE; case Done: return TRUE; case -1: // Error d->error = XMLERR_LETTEREXPECTED; goto parseError; } } return TRUE; parseError: reportParseError(); return FALSE; } /*! Parse a AttValue [10] Precondition: the head stands on the beginning " or ' If this function was successful, the head stands on the first character after the closing " or ' and the value of the attribute is in string(). */ bool QXmlSimpleReader::parseAttValue() { bool tmp; const signed char Init = 0; const signed char Dq = 1; // double quotes were read const signed char DqRef = 2; // read references in double quotes const signed char DqC = 3; // signed character read in double quotes const signed char Sq = 4; // single quotes were read const signed char SqRef = 5; // read references in single quotes const signed char SqC = 6; // signed character read in single quotes const signed char Done = 7; const signed char InpDq = 0; // " const signed char InpSq = 1; // ' const signed char InpAmp = 2; // & const signed char InpLt = 3; // < const signed char InpUnknown = 4; // use some kind of state machine for parsing static const signed char table[7][5] = { /* InpDq InpSq InpAmp InpLt InpUnknown */ { Dq, Sq, -1, -1, -1 }, // Init { Done, DqC, DqRef, -1, DqC }, // Dq { Done, DqC, DqRef, -1, DqC }, // DqRef { Done, DqC, DqRef, -1, DqC }, // DqC { SqC, Done, SqRef, -1, SqC }, // Sq { SqC, Done, SqRef, -1, SqC }, // SqRef { SqC, Done, SqRef, -1, SqC } // SqRef }; signed char state = Init; signed char input; bool parseOk = TRUE; for (;;) { // get input if ( atEnd() ) { d->error = XMLERR_UNEXPECTEDEOF; goto parseError; } if ( c == '"' ) { input = InpDq; } else if ( c == '\'' ) { input = InpSq; } else if ( c == '&' ) { input = InpAmp; } else if ( c == '<' ) { input = InpLt; } else { input = InpUnknown; } // set state according to input state = table[state][input]; // do some actions according to state switch ( state ) { case Dq: case Sq: stringClear(); next(); break; case DqRef: case SqRef: parseOk = parseReference( tmp, InAttributeValue ); break; case DqC: case SqC: stringAddC(); next(); break; case Done: next(); break; } // no input is read after this switch ( state ) { case DqRef: case SqRef: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGREFERENCE; goto parseError; } break; case Done: return TRUE; case -1: // Error d->error = XMLERR_UNEXPECTEDCHARACTER; goto parseError; } } return TRUE; parseError: reportParseError(); return FALSE; } /*! Parse a elementdecl [45]. Precondition: the beginning '<!E' is already read and the head stands on the 'L' of '<!ELEMENT' */ bool QXmlSimpleReader::parseElementDecl() { const signed char Init = 0; const signed char Elem = 1; // parse the beginning string const signed char Ws1 = 2; // whitespace required const signed char Nam = 3; // parse Name const signed char Ws2 = 4; // whitespace required const signed char Empty = 5; // read EMPTY const signed char Any = 6; // read ANY const signed char Cont = 7; // read contentspec (except ANY or EMPTY) const signed char Mix = 8; // read Mixed const signed char Mix2 = 9; // const signed char Mix3 = 10; // const signed char MixN1 = 11; // const signed char MixN2 = 12; // const signed char MixN3 = 13; // const signed char MixN4 = 14; // const signed char Cp = 15; // parse cp const signed char Cp2 = 16; // const signed char WsD = 17; // eat whitespace before Done const signed char Done = 18; const signed char InpWs = 0; const signed char InpGt = 1; // > const signed char InpPipe = 2; // | const signed char InpOp = 3; // ( const signed char InpCp = 4; // ) const signed char InpHash = 5; // # const signed char InpQm = 6; // ? const signed char InpAst = 7; // * const signed char InpPlus = 8; // + const signed char InpA = 9; // A const signed char InpE = 10; // E const signed char InpL = 11; // L const signed char InpUnknown = 12; // use some kind of state machine for parsing static const signed char table[18][13] = { /* InpWs InpGt InpPipe InpOp InpCp InpHash InpQm InpAst InpPlus InpA InpE InpL InpUnknown */ { -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, Elem, -1 }, // Init { Ws1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1 }, // Elem { -1, -1, -1, -1, -1, -1, -1, -1, -1, Nam, Nam, Nam, Nam }, // Ws1 { Ws2, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1 }, // Nam { -1, -1, -1, Cont, -1, -1, -1, -1, -1, Any, Empty, -1, -1 }, // Ws2 { WsD, Done, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1 }, // Empty { WsD, Done, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1 }, // Any { -1, -1, -1, Cp, Cp, Mix, -1, -1, -1, Cp, Cp, Cp, Cp }, // Cont { Mix2, -1, MixN1, -1, Mix3, -1, -1, -1, -1, -1, -1, -1, -1 }, // Mix { -1, -1, MixN1, -1, Mix3, -1, -1, -1, -1, -1, -1, -1, -1 }, // Mix2 { WsD, Done, -1, -1, -1, -1, -1, WsD, -1, -1, -1, -1, -1 }, // Mix3 { -1, -1, -1, -1, -1, -1, -1, -1, -1, MixN2, MixN2, MixN2, MixN2 }, // MixN1 { MixN3, -1, MixN1, -1, MixN4, -1, -1, -1, -1, -1, -1, -1, -1 }, // MixN2 { -1, -1, MixN1, -1, MixN4, -1, -1, -1, -1, -1, -1, -1, -1 }, // MixN3 { -1, -1, -1, -1, -1, -1, -1, WsD, -1, -1, -1, -1, -1 }, // MixN4 { WsD, Done, -1, -1, -1, -1, Cp2, Cp2, Cp2, -1, -1, -1, -1 }, // Cp { WsD, Done, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1 }, // Cp2 { -1, Done, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1 } // WsD }; signed char state = Init; signed char input; bool parseOk = TRUE; for (;;) { // read input if ( atEnd() ) { d->error = XMLERR_UNEXPECTEDEOF; goto parseError; } if ( is_S(c) ) { input = InpWs; } else if ( c == '>' ) { input = InpGt; } else if ( c == '|' ) { input = InpPipe; } else if ( c == '(' ) { input = InpOp; } else if ( c == ')' ) { input = InpCp; } else if ( c == '#' ) { input = InpHash; } else if ( c == '?' ) { input = InpQm; } else if ( c == '*' ) { input = InpAst; } else if ( c == '+' ) { input = InpPlus; } else if ( c == 'A' ) { input = InpA; } else if ( c == 'E' ) { input = InpE; } else if ( c == 'L' ) { input = InpL; } else { input = InpUnknown; } // get new state //qDebug( "%d -%d(%c)-> %d", state, input, c.latin1(), table[state][input] ); state = table[state][input]; // in some cases do special actions depending on state switch ( state ) { case Elem: parseOk = parseString( "LEMENT" ); break; case Ws1: eat_ws(); break; case Nam: parseOk = parseName(); break; case Ws2: eat_ws(); break; case Empty: parseOk = parseString( "EMPTY" ); break; case Any: parseOk = parseString( "ANY" ); break; case Cont: next_eat_ws(); break; case Mix: parseOk = parseString( "#PCDATA" ); break; case Mix2: eat_ws(); break; case Mix3: next(); break; case MixN1: next_eat_ws(); break; case MixN2: parseOk = parseName(); break; case MixN3: eat_ws(); break; case MixN4: next(); break; case Cp: parseOk = parseChoiceSeq(); break; case Cp2: next(); break; case WsD: next_eat_ws(); break; case Done: next(); break; } // no input is read after this switch ( state ) { case Elem: if( !parseOk ) { d->error = XMLERR_UNEXPECTEDCHARACTER; goto parseError; } break; case Nam: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGNAME; goto parseError; } break; case Empty: if( !parseOk ) { d->error = XMLERR_UNEXPECTEDCHARACTER; goto parseError; } break; case Any: if( !parseOk ) { d->error = XMLERR_UNEXPECTEDCHARACTER; goto parseError; } break; case Mix: if( !parseOk ) { d->error = XMLERR_UNEXPECTEDCHARACTER; goto parseError; } break; case MixN2: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGNAME; goto parseError; } break; case Cp: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGCHOICE; goto parseError; } break; case Done: return TRUE; case -1: d->error = XMLERR_UNEXPECTEDCHARACTER; goto parseError; } } return TRUE; parseError: reportParseError(); return FALSE; } /*! Parse a NotationDecl [82]. Precondition: the beginning '<!' is already read and the head stands on the 'N' of '<!NOTATION' */ bool QXmlSimpleReader::parseNotationDecl() { const signed char Init = 0; const signed char Not = 1; // read NOTATION const signed char Ws1 = 2; // eat whitespaces const signed char Nam = 3; // read Name const signed char Ws2 = 4; // eat whitespaces const signed char ExtID = 5; // parse ExternalID const signed char Ws3 = 6; // eat whitespaces const signed char Done = 7; const signed char InpWs = 0; const signed char InpGt = 1; // > const signed char InpN = 2; // N const signed char InpUnknown = 3; // use some kind of state machine for parsing static const signed char table[7][4] = { /* InpWs InpGt InpN InpUnknown */ { -1, -1, Not, -1 }, // Init { Ws1, -1, -1, -1 }, // Not { -1, -1, Nam, Nam }, // Ws1 { Ws2, Done, -1, -1 }, // Nam { -1, Done, ExtID, ExtID }, // Ws2 { Ws3, Done, -1, -1 }, // ExtID { -1, Done, -1, -1 } // Ws3 }; signed char state = Init; signed char input; bool parseOk = TRUE; for (;;) { // get input if ( atEnd() ) { d->error = XMLERR_UNEXPECTEDEOF; goto parseError; } if ( is_S(c) ) { input = InpWs; } else if ( c == '>' ) { input = InpGt; } else if ( c == 'N' ) { input = InpN; } else { input = InpUnknown; } // set state according to input state = table[state][input]; // do some actions according to state switch ( state ) { case Not: parseOk = parseString( "NOTATION" ); break; case Ws1: eat_ws(); break; case Nam: parseOk = parseName(); break; case Ws2: eat_ws(); break; case ExtID: parseOk = parseExternalID( TRUE ); break; case Ws3: eat_ws(); break; case Done: next(); break; } // no input is read after this switch ( state ) { case Not: if ( !parseOk ) { d->error = XMLERR_UNEXPECTEDCHARACTER; goto parseError; } break; case Nam: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGNAME; goto parseError; } break; case ExtID: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGEXTERNALID; goto parseError; } // call the handler if ( dtdHnd ) { if ( !dtdHnd->notationDecl( name(), d->publicId, d->systemId ) ) { d->error = dtdHnd->errorString(); goto parseError; } } break; case Done: return TRUE; case -1: // Error d->error = XMLERR_UNEXPECTEDCHARACTER; goto parseError; } } return TRUE; parseError: reportParseError(); return FALSE; } /*! Parse choice [49] or seq [50]. Precondition: the beginning '('S? is already read and the head stands on the first non-whitespace character after it. */ bool QXmlSimpleReader::parseChoiceSeq() { const signed char Init = 0; const signed char Ws1 = 1; // eat whitespace const signed char CS = 2; // choice or set const signed char Ws2 = 3; // eat whitespace const signed char More = 4; // more cp to read const signed char Name = 5; // read name const signed char Done = 6; // const signed char InpWs = 0; // S const signed char InpOp = 1; // ( const signed char InpCp = 2; // ) const signed char InpQm = 3; // ? const signed char InpAst = 4; // * const signed char InpPlus = 5; // + const signed char InpPipe = 6; // | const signed char InpComm = 7; // , const signed char InpUnknown = 8; // use some kind of state machine for parsing static const signed char table[6][9] = { /* InpWs InpOp InpCp InpQm InpAst InpPlus InpPipe InpComm InpUnknown */ { -1, Ws1, -1, -1, -1, -1, -1, -1, Name }, // Init { -1, CS, -1, -1, -1, -1, -1, -1, CS }, // Ws1 { Ws2, -1, Done, Ws2, Ws2, Ws2, More, More, -1 }, // CS { -1, -1, Done, -1, -1, -1, More, More, -1 }, // Ws2 { -1, Ws1, -1, -1, -1, -1, -1, -1, Name }, // More (same as Init) { Ws2, -1, Done, Ws2, Ws2, Ws2, More, More, -1 } // Name (same as CS) }; signed char state = Init; signed char input; bool parseOk = TRUE; for (;;) { // get input if ( atEnd() ) { d->error = XMLERR_UNEXPECTEDEOF; goto parseError; } if ( is_S(c) ) { input = InpWs; } else if ( c == '(' ) { input = InpOp; } else if ( c == ')' ) { input = InpCp; } else if ( c == '?' ) { input = InpQm; } else if ( c == '*' ) { input = InpAst; } else if ( c == '+' ) { input = InpPlus; } else if ( c == '|' ) { input = InpPipe; } else if ( c == ',' ) { input = InpComm; } else { input = InpUnknown; } // set state according to input state = table[state][input]; // do some actions according to state switch ( state ) { case Ws1: next_eat_ws(); break; case CS: parseOk = parseChoiceSeq(); break; case Ws2: next_eat_ws(); break; case More: next_eat_ws(); break; case Name: parseOk = parseName(); break; case Done: next(); break; } // no input is read after this switch ( state ) { case CS: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGCHOICE; goto parseError; } break; case Name: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGNAME; goto parseError; } break; case Done: return TRUE; case -1: // Error d->error = XMLERR_UNEXPECTEDCHARACTER; goto parseError; } } return TRUE; parseError: reportParseError(); return FALSE; } /*! Parse a EntityDecl [70]. Precondition: the beginning '<!E' is already read and the head stand on the 'N' of '<!ENTITY' */ bool QXmlSimpleReader::parseEntityDecl() { const signed char Init = 0; const signed char Ent = 1; // parse "ENTITY" const signed char Ws1 = 2; // white space read const signed char Name = 3; // parse name const signed char Ws2 = 4; // white space read const signed char EValue = 5; // parse entity value const signed char ExtID = 6; // parse ExternalID const signed char Ws3 = 7; // white space read const signed char Ndata = 8; // parse "NDATA" const signed char Ws4 = 9; // white space read const signed char NNam = 10; // parse name const signed char PEDec = 11; // parse PEDecl const signed char Ws6 = 12; // white space read const signed char PENam = 13; // parse name const signed char Ws7 = 14; // white space read const signed char PEVal = 15; // parse entity value const signed char PEEID = 16; // parse ExternalID const signed char WsE = 17; // white space read const signed char EDDone = 19; // done, but also report an external, unparsed entity decl const signed char Done = 18; const signed char InpWs = 0; // white space const signed char InpPer = 1; // % const signed char InpQuot = 2; // " or ' const signed char InpGt = 3; // > const signed char InpN = 4; // N const signed char InpUnknown = 5; // use some kind of state machine for parsing static const signed char table[18][6] = { /* InpWs InpPer InpQuot InpGt InpN InpUnknown */ { -1, -1, -1, -1, Ent, -1 }, // Init { Ws1, -1, -1, -1, -1, -1 }, // Ent { -1, PEDec, -1, -1, Name, Name }, // Ws1 { Ws2, -1, -1, -1, -1, -1 }, // Name { -1, -1, EValue, -1, -1, ExtID }, // Ws2 { WsE, -1, -1, Done, -1, -1 }, // EValue { Ws3, -1, -1, EDDone,-1, -1 }, // ExtID { -1, -1, -1, EDDone,Ndata, -1 }, // Ws3 { Ws4, -1, -1, -1, -1, -1 }, // Ndata { -1, -1, -1, -1, NNam, NNam }, // Ws4 { WsE, -1, -1, Done, -1, -1 }, // NNam { Ws6, -1, -1, -1, -1, -1 }, // PEDec { -1, -1, -1, -1, PENam, PENam }, // Ws6 { Ws7, -1, -1, -1, -1, -1 }, // PENam { -1, -1, PEVal, -1, -1, PEEID }, // Ws7 { WsE, -1, -1, Done, -1, -1 }, // PEVal { WsE, -1, -1, Done, -1, -1 }, // PEEID { -1, -1, -1, Done, -1, -1 } // WsE }; signed char state = Init; signed char input; bool parseOk = TRUE; for (;;) { // get input if ( atEnd() ) { d->error = XMLERR_UNEXPECTEDEOF; goto parseError; } if ( is_S(c) ) { input = InpWs; } else if ( c == '%' ) { input = InpPer; } else if ( c == '"' || c == '\'' ) { input = InpQuot; } else if ( c == '>' ) { input = InpGt; } else if ( c == 'N' ) { input = InpN; } else { input = InpUnknown; } // set state according to input state = table[state][input]; // do some actions according to state switch ( state ) { case Ent: parseOk = parseString( "NTITY" ); break; case Ws1: eat_ws(); break; case Name: parseOk = parseName(); break; case Ws2: eat_ws(); break; case EValue: parseOk = parseEntityValue(); break; case ExtID: parseOk = parseExternalID(); break; case Ws3: eat_ws(); break; case Ndata: parseOk = parseString( "NDATA" ); break; case Ws4: eat_ws(); break; case NNam: parseOk = parseName( TRUE ); break; case PEDec: next(); break; case Ws6: eat_ws(); break; case PENam: parseOk = parseName(); break; case Ws7: eat_ws(); break; case PEVal: parseOk = parseEntityValue(); break; case PEEID: parseOk = parseExternalID(); break; case WsE: eat_ws(); break; case EDDone: next(); break; case Done: next(); break; } // no input is read after this switch ( state ) { case Ent: if ( !parseOk ) { d->error = XMLERR_UNEXPECTEDCHARACTER; goto parseError; } break; case Name: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGNAME; goto parseError; } break; case EValue: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGENTITYVALUE; goto parseError; } if ( !entityExist( name() ) ) { d->entities.insert( name(), string() ); if ( declHnd ) { if ( !declHnd->internalEntityDecl( name(), string() ) ) { d->error = declHnd->errorString(); goto parseError; } } } break; case ExtID: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGEXTERNALID; goto parseError; } break; case Ndata: if ( !parseOk ) { d->error = XMLERR_UNEXPECTEDCHARACTER; goto parseError; } break; case NNam: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGNAME; goto parseError; } if ( !entityExist( name() ) ) { d->externEntities.insert( name(), QXmlSimpleReaderPrivate::ExternEntity( d->publicId, d->systemId, ref() ) ); if ( dtdHnd ) { if ( !dtdHnd->unparsedEntityDecl( name(), d->publicId, d->systemId, ref() ) ) { d->error = declHnd->errorString(); goto parseError; } } } break; case PENam: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGNAME; goto parseError; } break; case PEVal: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGENTITYVALUE; goto parseError; } if ( !entityExist( name() ) ) { d->parameterEntities.insert( name(), string() ); if ( declHnd ) { if ( !declHnd->internalEntityDecl( QString("%")+name(), string() ) ) { d->error = declHnd->errorString(); goto parseError; } } } break; case PEEID: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGEXTERNALID; goto parseError; } if ( !entityExist( name() ) ) { d->externParameterEntities.insert( name(), QXmlSimpleReaderPrivate::ExternParameterEntity( d->publicId, d->systemId ) ); if ( declHnd ) { if ( !declHnd->externalEntityDecl( QString("%")+name(), d->publicId, d->systemId ) ) { d->error = declHnd->errorString(); goto parseError; } } } break; case EDDone: if ( !entityExist( name() ) ) { d->externEntities.insert( name(), QXmlSimpleReaderPrivate::ExternEntity( d->publicId, d->systemId, QString::null ) ); if ( declHnd ) { if ( !declHnd->externalEntityDecl( name(), d->publicId, d->systemId ) ) { d->error = declHnd->errorString(); goto parseError; } } } return TRUE; case Done: return TRUE; case -1: // Error d->error = XMLERR_LETTEREXPECTED; goto parseError; } } return TRUE; parseError: reportParseError(); return FALSE; } /*! Parse a EntityValue [9] */ bool QXmlSimpleReader::parseEntityValue() { bool tmp; const signed char Init = 0; const signed char Dq = 1; // EntityValue is double quoted const signed char DqC = 2; // signed character const signed char DqPER = 3; // PERefence const signed char DqRef = 4; // Reference const signed char Sq = 5; // EntityValue is double quoted const signed char SqC = 6; // signed character const signed char SqPER = 7; // PERefence const signed char SqRef = 8; // Reference const signed char Done = 9; const signed char InpDq = 0; // " const signed char InpSq = 1; // ' const signed char InpAmp = 2; // & const signed char InpPer = 3; // % const signed char InpUnknown = 4; // use some kind of state machine for parsing static const signed char table[9][5] = { /* InpDq InpSq InpAmp InpPer InpUnknown */ { Dq, Sq, -1, -1, -1 }, // Init { Done, DqC, DqRef, DqPER, DqC }, // Dq { Done, DqC, DqRef, DqPER, DqC }, // DqC { Done, DqC, DqRef, DqPER, DqC }, // DqPER { Done, DqC, DqRef, DqPER, DqC }, // DqRef { SqC, Done, SqRef, SqPER, SqC }, // Sq { SqC, Done, SqRef, SqPER, SqC }, // SqC { SqC, Done, SqRef, SqPER, SqC }, // SqPER { SqC, Done, SqRef, SqPER, SqC } // SqRef }; signed char state = Init; signed char input; bool parseOk = TRUE; for (;;) { // get input if ( atEnd() ) { d->error = XMLERR_UNEXPECTEDEOF; goto parseError; } if ( c == '"' ) { input = InpDq; } else if ( c == '\'' ) { input = InpSq; } else if ( c == '&' ) { input = InpAmp; } else if ( c == '%' ) { input = InpPer; } else { input = InpUnknown; } // set state according to input state = table[state][input]; // do some actions according to state switch ( state ) { case Dq: case Sq: stringClear(); next(); break; case DqC: case SqC: stringAddC(); next(); break; case DqPER: case SqPER: parseOk = parsePEReference( InEntityValue ); break; case DqRef: case SqRef: parseOk = parseReference( tmp, InEntityValue ); break; case Done: next(); break; } // no input is read after this switch ( state ) { case DqPER: case SqPER: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGDOCTYPE; goto parseError; } break; case DqRef: case SqRef: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGREFERENCE; goto parseError; } break; case Done: return TRUE; case -1: // Error d->error = XMLERR_LETTEREXPECTED; goto parseError; } } return TRUE; parseError: reportParseError(); return FALSE; } /*! Parse a comment [15]. Precondition: the beginning '<!' of the comment is already read and the head stands on the first '-' of '<!--'. If this funktion was successful, the head-position is on the first character after the comment. */ bool QXmlSimpleReader::parseComment() { const signed char Init = 0; const signed char Dash1 = 1; // the first dash was read const signed char Dash2 = 2; // the second dash was read const signed char Com = 3; // read comment const signed char Com2 = 4; // read comment (help state) const signed char ComE = 5; // finished reading comment const signed char Done = 6; const signed char InpDash = 0; // - const signed char InpGt = 1; // > const signed char InpUnknown = 2; // use some kind of state machine for parsing static const signed char table[6][3] = { /* InpDash InpGt InpUnknown */ { Dash1, -1, -1 }, // Init { Dash2, -1, -1 }, // Dash1 { Com2, Com, Com }, // Dash2 { Com2, Com, Com }, // Com { ComE, Com, Com }, // Com2 { -1, Done, -1 } // ComE }; signed char state = Init; signed char input; for (;;) { // get input if ( atEnd() ) { d->error = XMLERR_UNEXPECTEDEOF; goto parseError; } if ( c == '-' ) { input = InpDash; } else if ( c == '>' ) { input = InpGt; } else { input = InpUnknown; } // set state according to input state = table[state][input]; // do some actions according to state switch ( state ) { case Dash1: next(); break; case Dash2: next(); break; case Com: stringAddC(); next(); break; case Com2: next(); break; case ComE: next(); break; case Done: next(); break; } // no input is read after this switch ( state ) { case Dash2: stringClear(); break; case Com2: // if next character is not a dash than don't skip it if ( c != '-' ) { stringAddC( '-' ); } break; case Done: return TRUE; case -1: // Error d->error = XMLERR_ERRORPARSINGCOMMENT; goto parseError; } } return TRUE; parseError: reportParseError(); return FALSE; } /*! Parse a Attribute [41]. Precondition: the head stands on the first character of the name of the attribute (i.e. all whitespaces are already parsed). The head stand on the next character after the end quotes. The variable name contains the name of the attribute and the variable string contains the value of the attribute. */ bool QXmlSimpleReader::parseAttribute() { const signed char Init = 0; const signed char PName = 1; // parse name const signed char Ws = 2; // eat ws const signed char Eq = 3; // the '=' was read const signed char Quotes = 4; // " or ' were read const signed char InpNameBe = 0; const signed char InpEq = 1; // = const signed char InpDq = 2; // " const signed char InpSq = 3; // ' const signed char InpUnknown = 4; // use some kind of state machine for parsing static const signed char table[4][5] = { /* InpNameBe InpEq InpDq InpSq InpUnknown */ { PName, -1, -1, -1, -1 }, // Init { -1, Eq, -1, -1, Ws }, // PName { -1, Eq, -1, -1, -1 }, // Ws { -1, -1, Quotes, Quotes, -1 } // Eq }; signed char state = Init; signed char input; bool parseOk = TRUE; for (;;) { // get input if ( atEnd() ) { d->error = XMLERR_UNEXPECTEDEOF; goto parseError; } if ( is_NameBeginning(c) ) { input = InpNameBe; } else if ( c == '=' ) { input = InpEq; } else if ( c == '"' ) { input = InpDq; } else if ( c == '\'' ) { input = InpSq; } else { input = InpUnknown; } // set state according to input state = table[state][input]; // do some actions according to state switch ( state ) { case PName: parseOk = parseName(); break; case Ws: eat_ws(); break; case Eq: next_eat_ws(); break; case Quotes: parseOk = parseAttValue(); break; } // no input is read after this switch ( state ) { case PName: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGNAME; goto parseError; } break; case Quotes: if ( !parseOk ) { d->error = XMLERR_ERRORPARSINGATTVALUE; goto parseError; } // Done return TRUE; case -1: // Error d->error = XMLERR_UNEXPECTEDCHARACTER; goto parseError; } } return TRUE; parseError: reportParseError(); return FALSE; } /*! Parse a Name [5] and store the name in name or ref (if useRef is TRUE). */ bool QXmlSimpleReader::parseName( bool useRef ) { const signed char Init = 0; const signed char Name1 = 1; // parse first signed character of the name const signed char Name = 2; // parse name const signed char Done = 3; const signed char InpNameBe = 0; // name beginning signed characters const signed char InpNameCh = 1; // NameChar without InpNameBe const signed char InpUnknown = 2; // use some kind of state machine for parsing static const signed char table[3][3] = { /* InpNameBe InpNameCh InpUnknown */ { Name1, -1, -1 }, // Init { Name, Name, Done }, // Name1 { Name, Name, Done } // Name }; signed char state = Init; signed char input; for (;;) { // get input if ( atEnd() ) { d->error = XMLERR_UNEXPECTEDEOF; goto parseError; } if ( is_NameBeginning(c) ) { input = InpNameBe; } else if ( is_NameChar(c) ) { input = InpNameCh; } else { input = InpUnknown; } // set state according to input state = table[state][input]; // do some actions according to state switch ( state ) { case Name1: if ( useRef ) { refClear(); refAddC(); } else { nameClear(); nameAddC(); } next(); break; case Name: if ( useRef ) { refAddC(); } else { nameAddC(); } next(); break; } // no input is read after this switch ( state ) { case Done: return TRUE; case -1: // Error d->error = XMLERR_LETTEREXPECTED; goto parseError; } } return TRUE; parseError: reportParseError(); return FALSE; } /*! Parse a Nmtoken [7] and store the name in name. */ bool QXmlSimpleReader::parseNmtoken() { const signed char Init = 0; const signed char NameF = 1; const signed char Name = 2; const signed char Done = 3; const signed char InpNameCh = 0; // NameChar without InpNameBe const signed char InpUnknown = 1; // use some kind of state machine for parsing static const signed char table[3][2] = { /* InpNameCh InpUnknown */ { NameF, -1 }, // Init { Name, Done }, // NameF { Name, Done } // Name }; signed char state = Init; signed char input; for (;;) { // get input if ( atEnd() ) { d->error = XMLERR_UNEXPECTEDEOF; goto parseError; } if ( is_NameChar(c) ) { input = InpNameCh; } else { input = InpUnknown; } // set state according to input state = table[state][input]; // do some actions according to state switch ( state ) { case NameF: nameClear(); nameAddC(); next(); break; case Name: nameAddC(); next(); break; } // no input is read after this switch ( state ) { case Done: return TRUE; case -1: // Error d->error = XMLERR_LETTEREXPECTED; goto parseError; } } return TRUE; parseError: reportParseError(); return FALSE; } /*! Parse a Reference [67]. charDataRead is set to TRUE if the reference must not be parsed. The character(s) which the reference mapped to are appended to string. The head stands on the first character after the reference. charDataRead is set to FALSE if the reference must be parsed. The charachter(s) which the reference mapped to are inserted at the reference position. The head stands on the first character of the replacement). */ bool QXmlSimpleReader::parseReference( bool &charDataRead, EntityRecognitionContext context ) { // temporary variables uint tmp; bool ok; const signed char Init = 0; const signed char SRef = 1; // start of a reference const signed char ChRef = 2; // parse CharRef const signed char ChDec = 3; // parse CharRef decimal const signed char ChHexS = 4; // start CharRef hexadecimal const signed char ChHex = 5; // parse CharRef hexadecimal const signed char Name = 6; // parse name const signed char DoneD = 7; // done CharRef decimal const signed char DoneH = 8; // done CharRef hexadecimal const signed char DoneN = 9; // done EntityRef const signed char InpAmp = 0; // & const signed char InpSemi = 1; // ; const signed char InpHash = 2; // # const signed char InpX = 3; // x const signed char InpNum = 4; // 0-9 const signed char InpHex = 5; // a-f A-F const signed char InpUnknown = 6; // use some kind of state machine for parsing static const signed char table[8][7] = { /* InpAmp InpSemi InpHash InpX InpNum InpHex InpUnknown */ { SRef, -1, -1, -1, -1, -1, -1 }, // Init { -1, -1, ChRef, Name, Name, Name, Name }, // SRef { -1, -1, -1, ChHexS, ChDec, -1, -1 }, // ChRef { -1, DoneD, -1, -1, ChDec, -1, -1 }, // ChDec { -1, -1, -1, -1, ChHex, ChHex, -1 }, // ChHexS { -1, DoneH, -1, -1, ChHex, ChHex, -1 }, // ChHex { -1, DoneN, -1, -1, -1, -1, -1 } // Name }; signed char state = Init; signed char input; for (;;) { // get input if ( atEnd() ) { d->error = XMLERR_UNEXPECTEDEOF; goto parseError; } if ( c.row() ) { input = InpUnknown; } else if ( c.cell() == '&' ) { input = InpAmp; } else if ( c.cell() == ';' ) { input = InpSemi; } else if ( c.cell() == '#' ) { input = InpHash; } else if ( c.cell() == 'x' ) { input = InpX; } else if ( '0' <= c.cell() && c.cell() <= '9' ) { input = InpNum; } else if ( 'a' <= c.cell() && c.cell() <= 'f' ) { input = InpHex; } else if ( 'A' <= c.cell() && c.cell() <= 'F' ) { input = InpHex; } else { input = InpUnknown; } // set state according to input state = table[state][input]; // do some actions according to state switch ( state ) { case SRef: refClear(); next(); break; case ChRef: next(); break; case ChDec: refAddC(); next(); break; case ChHexS: next(); break; case ChHex: refAddC(); next(); break; case Name: // read the name into the ref parseName( TRUE ); break; case DoneD: tmp = ref().toUInt( &ok, 10 ); if ( ok ) { stringAddC( QChar(tmp) ); } else { d->error = XMLERR_ERRORPARSINGREFERENCE; goto parseError; } charDataRead = TRUE; next(); break; case DoneH: tmp = ref().toUInt( &ok, 16 ); if ( ok ) { stringAddC( QChar(tmp) ); } else { d->error = XMLERR_ERRORPARSINGREFERENCE; goto parseError; } charDataRead = TRUE; next(); break; case DoneN: if ( !processReference( charDataRead, context ) ) goto parseError; next(); break; } // no input is read after this switch ( state ) { case DoneD: return TRUE; case DoneH: return TRUE; case DoneN: return TRUE; case -1: // Error d->error = XMLERR_ERRORPARSINGREFERENCE; goto parseError; } } return TRUE; parseError: reportParseError(); return FALSE; } /*! Helper function for parseReference() */ bool QXmlSimpleReader::processReference( bool &charDataRead, EntityRecognitionContext context ) { QString reference = ref(); if ( reference == "amp" ) { if ( context == InEntityValue ) { // Bypassed stringAddC( '&' ); stringAddC( 'a' ); stringAddC( 'm' ); stringAddC( 'p' ); stringAddC( ';' ); } else { // Included or Included in literal stringAddC( '&' ); } charDataRead = TRUE; } else if ( reference == "lt" ) { if ( context == InEntityValue ) { // Bypassed stringAddC( '&' ); stringAddC( 'l' ); stringAddC( 't' ); stringAddC( ';' ); } else { // Included or Included in literal stringAddC( '<' ); } charDataRead = TRUE; } else if ( reference == "gt" ) { if ( context == InEntityValue ) { // Bypassed stringAddC( '&' ); stringAddC( 'g' ); stringAddC( 't' ); stringAddC( ';' ); } else { // Included or Included in literal stringAddC( '>' ); } charDataRead = TRUE; } else if ( reference == "apos" ) { if ( context == InEntityValue ) { // Bypassed stringAddC( '&' ); stringAddC( 'a' ); stringAddC( 'p' ); stringAddC( 'o' ); stringAddC( 's' ); stringAddC( ';' ); } else { // Included or Included in literal stringAddC( '\'' ); } charDataRead = TRUE; } else if ( reference == "quot" ) { if ( context == InEntityValue ) { // Bypassed stringAddC( '&' ); stringAddC( 'q' ); stringAddC( 'u' ); stringAddC( 'o' ); stringAddC( 't' ); stringAddC( ';' ); } else { // Included or Included in literal stringAddC( '"' ); } charDataRead = TRUE; } else { QMap<QString,QString>::Iterator it; it = d->entities.find( reference ); if ( it != d->entities.end() ) { // "Internal General" switch ( context ) { case InContent: // Included xmlRef = it.data() + xmlRef; charDataRead = FALSE; break; case InAttributeValue: // Included in literal xmlRef = it.data().replace( QRegExp("\""), """ ).replace( QRegExp("'"), "'" ) + xmlRef; charDataRead = FALSE; break; case InEntityValue: { // Bypassed stringAddC( '&' ); for ( int i=0; i<(int)reference.length(); i++ ) { stringAddC( reference[i] ); } stringAddC( ';'); charDataRead = TRUE; } break; case InDTD: // Forbidden d->error = XMLERR_INTERNALGENERALENTITYINDTD; charDataRead = FALSE; break; } } else { QMap<QString,QXmlSimpleReaderPrivate::ExternEntity>::Iterator itExtern; itExtern = d->externEntities.find( reference ); if ( itExtern == d->externEntities.end() ) { // entity not declared // ### check this case for conformance if ( context == InEntityValue ) { // Bypassed stringAddC( '&' ); for ( int i=0; i<(int)reference.length(); i++ ) { stringAddC( reference[i] ); } stringAddC( ';'); charDataRead = TRUE; } else { if ( contentHnd ) { if ( !contentHnd->skippedEntity( reference ) ) { d->error = contentHnd->errorString(); return FALSE; // error } } } } else if ( (*itExtern).notation.isNull() ) { // "External Parsed General" switch ( context ) { case InContent: // Included if validating if ( contentHnd ) { if ( !contentHnd->skippedEntity( reference ) ) { d->error = contentHnd->errorString(); return FALSE; // error } } charDataRead = FALSE; break; case InAttributeValue: // Forbidden d->error = XMLERR_EXTERNALGENERALENTITYINAV; charDataRead = FALSE; break; case InEntityValue: { // Bypassed stringAddC( '&' ); for ( int i=0; i<(int)reference.length(); i++ ) { stringAddC( reference[i] ); } stringAddC( ';'); charDataRead = TRUE; } break; case InDTD: // Forbidden d->error = XMLERR_EXTERNALGENERALENTITYINDTD; charDataRead = FALSE; break; } } else { // "Unparsed" // ### notify for "Occurs as Attribute Value" missing (but this is no refence, anyway) // Forbidden d->error = XMLERR_UNPARSEDENTITYREFERENCE; charDataRead = FALSE; return FALSE; // error } } } return TRUE; // no error } /*! Parse over a simple string. After the string was successfully parsed, the head is on the first character after the string. */ bool QXmlSimpleReader::parseString( const QString& s ) { signed char Done = s.length(); const signed char InpCharExpected = 0; // the character that was expected const signed char InpUnknown = 1; signed char state = 0; // state in this function is the position in the string s signed char input; for (;;) { // get input if ( atEnd() ) { d->error = XMLERR_UNEXPECTEDEOF; goto parseError; } if ( c == s[(int)state] ) { input = InpCharExpected; } else { input = InpUnknown; } // set state according to input if ( input == InpCharExpected ) { state++; } else { // Error d->error = XMLERR_UNEXPECTEDCHARACTER; goto parseError; } // do some actions according to state next(); // no input is read after this if ( state == Done ) { return TRUE; } } return TRUE; parseError: reportParseError(); return FALSE; } /*! Inits the data values. */ void QXmlSimpleReader::init( const QXmlInputSource& i ) { xml = i.data(); xmlLength = xml.length(); xmlRef = ""; d->externParameterEntities.clear(); d->parameterEntities.clear(); d->externEntities.clear(); d->entities.clear(); tags.clear(); d->doctype = ""; d->xmlVersion = ""; d->encoding = ""; d->standalone = QXmlSimpleReaderPrivate::Unknown; lineNr = 0; columnNr = -1; pos = 0; next(); d->error = XMLERR_OK; } /*! Returns TRUE if a entity with the name \a e exists, otherwise returns FALSE. */ bool QXmlSimpleReader::entityExist( const QString& e ) const { if ( d->parameterEntities.find(e) == d->parameterEntities.end() && d->externParameterEntities.find(e) == d->externParameterEntities.end() ) { return FALSE; } else { return TRUE; } } void QXmlSimpleReader::reportParseError() { if ( errorHnd ) errorHnd->fatalError( QXmlParseException( d->error, columnNr+1, lineNr+1 ) ); } //US #endif //QT_NO_XML