Mbed port of the Simple Plain Xml parser. See http://code.google.com/p/spxml/ for more details. This library uses less memory and is much better suited to streaming data than TinyXML (doesn\'t use as much C++ features, and especially works without streams). See http://mbed.org/users/hlipka/notebook/xml-parsing/ for usage examples.

Dependents:   spxmltest_weather VFD_fontx2_weather weather_LCD_display News_LCD_display ... more

Revision:
0:3fa97f2c0505
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/spxmlreader.cpp	Wed Nov 24 20:52:14 2010 +0000
@@ -0,0 +1,572 @@
+/*
+ * Copyright 2007 Stephen Liu
+ * LGPL, see http://code.google.com/p/spxml/
+ * For license terms, see the file COPYING along with this library.
+ */
+
+#include <string.h>
+#include <ctype.h>
+#include <stdlib.h>
+#include <typeinfo>
+
+#include "spxmlparser.hpp"
+#include "spxmlreader.hpp"
+#include "spxmlutils.hpp"
+#include "spxmlstag.hpp"
+#include "spxmlevent.hpp"
+#include "spxmlcodec.hpp"
+
+//=========================================================
+
+SP_XmlReader :: SP_XmlReader()
+{
+    mBuffer = new SP_XmlStringBuffer();
+}
+
+SP_XmlReader :: ~SP_XmlReader()
+{
+    delete mBuffer;
+}
+
+void SP_XmlReader :: changeReader(
+        SP_XmlPullParser * parser, SP_XmlReader * reader )
+{
+    parser->changeReader( reader );
+}
+
+SP_XmlReader * SP_XmlReader :: getReader( SP_XmlPullParser * parser, int type )
+{
+    return parser->getReader( type );
+}
+
+void SP_XmlReader :: setError( SP_XmlPullParser * parser, const char * error )
+{
+    parser->setError( error );
+}
+
+void SP_XmlReader :: reset()
+{
+    mBuffer->clean();
+}
+
+//=========================================================
+
+SP_XmlPIReader :: SP_XmlPIReader()
+{
+}
+
+SP_XmlPIReader :: ~SP_XmlPIReader()
+{
+}
+
+void SP_XmlPIReader :: read( SP_XmlPullParser * parser, char c )
+{
+    if( '>' == c ) {
+        changeReader( parser, getReader( parser, SP_XmlReader::ePCData ) );
+    } else {
+        mBuffer->append( c );
+    }
+}
+
+SP_XmlPullEvent * SP_XmlPIReader :: getEvent( SP_XmlPullParser * parser )
+{
+    SP_XmlPullEvent * retEvent = NULL;
+
+    if( mBuffer->getSize() > 0 ) {
+        char * begin = (char*)mBuffer->getBuffer();
+        for( ; isspace( *begin ); ) begin++;
+
+        char * end = begin;
+        for( ; '\0' != *end && '?' != *end && ( ! isspace( *end ) ); ) end++;
+
+        char savedChar = *end;
+        *end = '\0';
+
+        if( 0 == strcasecmp( begin, "xml" ) ) {
+            *end = savedChar;
+
+            retEvent = parseDocDeclEvent( parser, mBuffer );
+        } else {
+            SP_XmlPIEvent * piEvent = new SP_XmlPIEvent();
+            piEvent->setTarget( begin );
+
+            *end = savedChar;
+
+            begin = end;
+            for( ; isspace( *begin ); ) begin++;
+
+            end = begin;
+            for( ; '\0' != *end && '?' != *end; ) end++;
+
+            piEvent->setData( begin, end - begin );
+
+            retEvent = piEvent;
+        }
+    }
+
+    return retEvent;
+}
+
+SP_XmlPullEvent * SP_XmlPIReader :: parseDocDeclEvent( SP_XmlPullParser * parser,
+        SP_XmlStringBuffer * buffer )
+{
+    SP_XmlDocDeclEvent * retEvent = NULL;
+
+    SP_XmlSTagParser tagParser( parser->getEncoding() );
+
+    tagParser.append( buffer->getBuffer(), buffer->getSize() );
+    tagParser.append( " ", 1 );
+
+    if( NULL == tagParser.getError() ) {
+        SP_XmlStartTagEvent * event = tagParser.takeEvent();
+
+        const char * version = event->getAttrValue( "version" );
+        const char * encoding = event->getAttrValue( "encoding" );
+        const char * standalone = event->getAttrValue( "standalone" );
+
+        retEvent = new SP_XmlDocDeclEvent();
+        retEvent->setVersion( NULL == version ? "" : version );
+        retEvent->setEncoding( NULL == encoding ? "" : encoding );
+        if( NULL != standalone ) {
+            if( 0 == strcasecmp( "no", standalone ) ) {
+                retEvent->setStandalone( 0 );
+            } else {
+                retEvent->setStandalone( 1 );
+            }
+        }
+
+        delete event;
+    } else {
+        setError( parser, tagParser.getError() );
+    }
+
+    return retEvent;
+}
+
+//=========================================================
+
+SP_XmlStartTagReader :: SP_XmlStartTagReader()
+{
+    mIsQuot = 0;
+}
+
+SP_XmlStartTagReader :: ~SP_XmlStartTagReader()
+{
+}
+
+void SP_XmlStartTagReader :: read( SP_XmlPullParser * parser, char c )
+{
+    if( '>' == c && 0 == mIsQuot ) {
+        changeReader( parser, getReader( parser, SP_XmlReader::ePCData ) );
+    } else if( '/' == c && 0 == mIsQuot ) {
+        SP_XmlReader * reader = getReader( parser, SP_XmlReader::eETag );
+        const char * pos = mBuffer->getBuffer();
+        for( ; isspace( *pos ); ) pos++;
+        for( ; 0 == isspace( *pos ) && '\0' != *pos; pos++ ) {
+            reader->read( parser, *pos );
+        }
+        changeReader( parser, reader );
+    } else if( '<' == c && 0 == mIsQuot ) {
+        setError( parser, "illegal char" );
+    } else {
+        mBuffer->append( c );
+
+        if( 0 == mIsQuot ) {
+            if( '\'' == c ) mIsQuot = 1;
+            if( '"' == c ) mIsQuot = 2;
+        } else {
+            if( 1 == mIsQuot && '\'' == c ) mIsQuot = 0;
+            if( 2 == mIsQuot && '"' == c ) mIsQuot = 0;
+        }
+    }
+}
+
+SP_XmlPullEvent * SP_XmlStartTagReader :: getEvent( SP_XmlPullParser * parser )
+{
+    SP_XmlStartTagEvent * retEvent = NULL;
+
+    SP_XmlSTagParser tagParser( parser->getEncoding() );
+    tagParser.append( mBuffer->getBuffer(), mBuffer->getSize() );
+    tagParser.append( " ", 1 );
+
+    if( NULL == tagParser.getError() ) {
+        retEvent = tagParser.takeEvent();
+    } else {
+        setError( parser, tagParser.getError() );
+    }
+
+    return retEvent;
+}
+
+void SP_XmlStartTagReader :: reset()
+{
+    SP_XmlReader::reset();
+    mIsQuot = 0;
+}
+
+//=========================================================
+
+SP_XmlEndTagReader :: SP_XmlEndTagReader()
+{
+}
+
+SP_XmlEndTagReader :: ~SP_XmlEndTagReader()
+{
+}
+
+void SP_XmlEndTagReader :: read( SP_XmlPullParser * parser,    char c )
+{
+    if( '>' == c ) {
+        changeReader( parser, getReader( parser, SP_XmlReader::ePCData ) );
+    } else if( '/' == c ) {
+        setError( parser, "illegal name char" );
+    } else {
+        mBuffer->append( c );
+    }
+}
+
+SP_XmlPullEvent * SP_XmlEndTagReader :: getEvent( SP_XmlPullParser * parser )
+{
+    const char * end = mBuffer->getBuffer() + mBuffer->getSize() - 1;
+
+    for( ; end > mBuffer->getBuffer() && isspace( *end ); ) end--;
+
+    SP_XmlEndTagEvent * retEvent = new SP_XmlEndTagEvent();
+    retEvent->setText( mBuffer->getBuffer(), end - mBuffer->getBuffer() + 1 );
+
+    return retEvent;
+}
+
+//=========================================================
+
+SP_XmlPCDataReader :: SP_XmlPCDataReader()
+{
+}
+
+SP_XmlPCDataReader :: ~SP_XmlPCDataReader()
+{
+}
+
+void SP_XmlPCDataReader :: read( SP_XmlPullParser * parser, char c )
+{
+    if( '<' == c ) {
+        SP_XmlReader * reader = getReader( parser, SP_XmlReader::eLBracket );
+        reader->read( parser, c );
+        changeReader( parser, reader );
+    } else {
+        mBuffer->append( c );
+    }
+}
+
+SP_XmlPullEvent * SP_XmlPCDataReader :: getEvent( SP_XmlPullParser * parser )
+{
+    SP_XmlCDataEvent * retEvent = NULL;
+
+    int ignore = 0;
+
+    if( 0 != parser->getIgnoreWhitespace() ) {
+        ignore = 1;
+        for( const char * pos = mBuffer->getBuffer(); '\0' != *pos; pos++ ) {
+            if( !isspace( *pos ) ) {
+                ignore = 0;
+                break;
+            }
+        }
+    }
+
+    if( 0 == ignore && mBuffer->getSize() > 0 ) {
+        retEvent = new SP_XmlCDataEvent();
+        SP_XmlStringBuffer buffer;
+        SP_XmlStringCodec::decode( parser->getEncoding(), mBuffer->getBuffer(), &buffer );
+        retEvent->setText( buffer.getBuffer(), buffer.getSize() );
+    }
+
+    return retEvent;
+}
+
+//=========================================================
+
+SP_XmlCDataSectionReader :: SP_XmlCDataSectionReader()
+{
+}
+
+SP_XmlCDataSectionReader :: ~SP_XmlCDataSectionReader()
+{
+}
+
+void SP_XmlCDataSectionReader :: read( SP_XmlPullParser * parser, char c )
+{
+    if( '>' == c && mBuffer->getSize() > 2 ) {
+        char last1 = mBuffer->getBuffer()[ mBuffer->getSize() - 1 ];
+        char last2 = mBuffer->getBuffer()[ mBuffer->getSize() - 2 ];
+
+        if( ']' == last1 && ']' == last2 ) {
+            changeReader( parser, getReader( parser, SP_XmlReader::ePCData ) );
+        } else {
+            mBuffer->append( c );
+        }
+    } else {
+        mBuffer->append( c );
+    }
+}
+
+SP_XmlPullEvent * SP_XmlCDataSectionReader :: getEvent( SP_XmlPullParser * parser )
+{
+    SP_XmlCDataEvent * retEvent = NULL;
+
+    int len = mBuffer->getSize();
+    const char * data = mBuffer->getBuffer();
+    if( 0 == strncmp( data, "CDATA[", strlen( "CDATA[" ) ) ) {
+        data += strlen( "CDATA[" );
+        len -= strlen( "CDATA[" );
+    }
+
+    int ignore = 0;
+    if( 0 != parser->getIgnoreWhitespace() ) {
+        ignore = 1;
+        for( int i = 0; i < len - 2; i++ ) {
+            if( !isspace( data[i] ) ) {
+                ignore = 0;
+                break;
+            }
+        }
+    }
+
+    if( 0 == ignore && len > 2 ) {
+        retEvent = new SP_XmlCDataEvent();
+        retEvent->setText( data, len - 2 );
+    }
+
+    return retEvent;
+}
+
+//=========================================================
+
+SP_XmlCommentReader :: SP_XmlCommentReader()
+{
+}
+
+SP_XmlCommentReader :: ~SP_XmlCommentReader()
+{
+}
+
+void SP_XmlCommentReader :: read( SP_XmlPullParser * parser, char c )
+{
+    if( '>' == c && mBuffer->getSize() >= 2 ) {
+        int size = mBuffer->getSize();
+        if( '-' == mBuffer->getBuffer()[ size - 1 ]
+                && '-' == mBuffer->getBuffer()[ size - 2 ] ) {
+            changeReader( parser, getReader( parser, SP_XmlReader::ePCData ) );
+        } else {
+            mBuffer->append( c );
+        }
+    } else {
+        mBuffer->append( c );
+    }
+}
+
+SP_XmlPullEvent * SP_XmlCommentReader :: getEvent( SP_XmlPullParser * parser )
+{
+    SP_XmlCommentEvent * retEvent = new SP_XmlCommentEvent();
+
+    retEvent->setText( mBuffer->getBuffer(), mBuffer->getSize() - 2 );
+
+    return retEvent;
+}
+
+//=========================================================
+
+SP_XmlDocTypeReader :: SP_XmlDocTypeReader()
+{
+}
+
+SP_XmlDocTypeReader :: ~SP_XmlDocTypeReader()
+{
+}
+
+void SP_XmlDocTypeReader :: read( SP_XmlPullParser * parser, char c )
+{
+    if( '>' == c ) {
+        if( NULL != strchr( mBuffer->getBuffer(), '[' ) ) {
+            char last = mBuffer->getBuffer()[ mBuffer->getSize() - 1 ];
+            if( ']' == last ) {
+                changeReader( parser, getReader( parser, SP_XmlReader::ePCData ) );
+            } else {
+                mBuffer->append( c );
+            }
+        } else {
+            changeReader( parser, getReader( parser, SP_XmlReader::ePCData ) );
+        }
+    } else {
+        mBuffer->append( c );
+    }
+}
+
+SP_XmlPullEvent * SP_XmlDocTypeReader :: getEvent( SP_XmlPullParser * parser )
+{
+    SP_XmlDocTypeEvent * retEvent = NULL;
+
+    SP_XmlSTagParser tagParser( parser->getEncoding() );
+
+    tagParser.append( "DOCTYPE ", strlen( "DOCTYPE " ) );
+    tagParser.append( mBuffer->getBuffer(), mBuffer->getSize() );
+    tagParser.append( " ", 1 );
+    if( NULL == tagParser.getError() ) {
+        SP_XmlStartTagEvent * event = tagParser.takeEvent();
+
+        retEvent = new SP_XmlDocTypeEvent();
+
+        for( int i = 0; i < event->getAttrCount(); i += 2 ) {
+            const char * name = event->getAttr( i, NULL );
+            if( 0 == strcmp( name, "DOCTYPE" ) ) {
+                name = event->getAttr( i + 1, NULL );
+                retEvent->setName( NULL == name ? "" : name );    
+            } else if( 0 == strcmp( name, "PUBLIC" ) ) {
+                name = event->getAttr( i + 1, NULL );
+                retEvent->setPublicID( NULL == name ? "" : name );
+            } else if( 0 == strcmp( name, "SYSTEM" ) ) {
+                name = event->getAttr( i + 1, NULL );
+                retEvent->setSystemID( NULL == name ? "" : name );
+            } else if( NULL != strstr( name, ".dtd" ) ) {
+                retEvent->setDTD( name );
+            }
+        }
+
+        delete event;
+    } else {
+        //setError( parser, tagParser.getError() );
+    }
+
+    return retEvent;
+}
+
+//=========================================================
+
+SP_XmlLeftBracketReader :: SP_XmlLeftBracketReader()
+{
+    mHasReadBracket = 0;
+}
+
+SP_XmlLeftBracketReader :: ~SP_XmlLeftBracketReader()
+{
+}
+
+void SP_XmlLeftBracketReader :: read( SP_XmlPullParser * parser, char c )
+{
+    if( 0 == mHasReadBracket ) {
+        if( isspace( c ) ) {
+            //skip
+        } else if( '<' == c ) {
+            mHasReadBracket = 1;
+        }
+    } else {
+        if( '?' == c ) {
+            changeReader( parser, getReader( parser, SP_XmlReader::ePI ) );
+        } else if( '/' == c ) {
+            changeReader( parser, getReader( parser, SP_XmlReader::eETag ) );
+        } else if( '!' == c ) {
+            changeReader( parser, getReader( parser, SP_XmlReader::eSign ) );
+        } else if( SP_XmlStringCodec::isNameChar( parser->getEncoding(), c ) ) {
+            SP_XmlReader * reader = getReader( parser, SP_XmlReader::eSTag );
+            reader->read( parser, c );
+            changeReader( parser, reader );
+        } else {
+            setError( parser, "not well-formed" );
+        }
+    }
+}
+
+SP_XmlPullEvent * SP_XmlLeftBracketReader :: getEvent( SP_XmlPullParser * parser )
+{
+    return NULL;
+}
+
+void SP_XmlLeftBracketReader :: reset()
+{
+    SP_XmlReader::reset();
+    mHasReadBracket = 0;
+}
+
+//=========================================================
+
+SP_XmlSignReader :: SP_XmlSignReader()
+{
+}
+
+SP_XmlSignReader :: ~SP_XmlSignReader()
+{
+}
+
+void SP_XmlSignReader :: read( SP_XmlPullParser * parser, char c )
+{
+    if( '[' == c ) {
+        changeReader( parser, getReader( parser, SP_XmlReader::eCDataSection ) );
+    } else if( '-' == c ) {
+        changeReader( parser, getReader( parser, SP_XmlReader::eComment ) );
+    } else if( isupper( c ) ) {
+        SP_XmlReader * reader = getReader( parser, SP_XmlReader::eDocType );
+        reader->read( parser, c );
+        changeReader( parser, reader );
+    } else {
+        setError( parser, "not well-formed" );
+    }
+}
+
+SP_XmlPullEvent * SP_XmlSignReader :: getEvent( SP_XmlPullParser * parser )
+{
+    return NULL;
+}
+
+//=========================================================
+
+SP_XmlReaderPool :: SP_XmlReaderPool()
+{
+    mReaderList = (SP_XmlReader**)malloc( sizeof( void * ) * SP_XmlReader::MAX_READER );
+    memset( mReaderList, 0, sizeof( void * ) * SP_XmlReader::MAX_READER );
+}
+
+SP_XmlReaderPool :: ~SP_XmlReaderPool()
+{
+    for( int i = 0; i < SP_XmlReader::MAX_READER; i++ ) {
+        if( NULL != mReaderList[i] ) {
+            delete mReaderList[i];
+        }
+    }
+    free( mReaderList );
+}
+
+SP_XmlReader * SP_XmlReaderPool :: borrow( int type )
+{
+    SP_XmlReader * reader = NULL;
+
+    if( type >= 0 && type < SP_XmlReader::MAX_READER ) {
+        reader = mReaderList[ type ];
+        if( NULL == reader ) {
+            switch( type ) {
+            case SP_XmlReader::ePI: reader = new SP_XmlPIReader(); break;
+            case SP_XmlReader::eSTag: reader = new SP_XmlStartTagReader(); break;
+            case SP_XmlReader::eETag: reader = new SP_XmlEndTagReader(); break;
+            case SP_XmlReader::ePCData: reader = new SP_XmlPCDataReader(); break;
+            case SP_XmlReader::eCDataSection: reader = new SP_XmlCDataSectionReader(); break;
+            case SP_XmlReader::eComment: reader = new SP_XmlCommentReader(); break;
+            case SP_XmlReader::eDocType: reader = new SP_XmlDocTypeReader(); break;
+            case SP_XmlReader::eLBracket: reader = new SP_XmlLeftBracketReader(); break;
+            case SP_XmlReader::eSign: reader = new SP_XmlSignReader(); break;
+            }
+            mReaderList[ type ] = reader;
+        }
+    }
+
+    //printf( "\nborrow change: %s\n", typeid( *reader ).name() );
+
+    return reader;
+}
+
+void SP_XmlReaderPool :: save( SP_XmlReader * reader )
+{
+    //printf( "\nreturn change: %s\n", typeid( *reader ).name() );
+    reader->reset();
+}
+
+//=========================================================
+