| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702
703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809 |
- #include "tinyxml2.h"
- #include <string.h>
- #include <stdlib.h>
- #include <stdio.h>
- #include <ctype.h>
- using namespace tinyxml2;
// Line-ending characters. Input line endings are normalized to LF and
// CR is filtered out.
static const char LINE_FEED       = static_cast<char>( 0x0a );
static const char LF              = LINE_FEED;
static const char CARRIAGE_RETURN = static_cast<char>( 0x0d );
static const char CR              = CARRIAGE_RETURN;

// Quote characters.
static const char SINGLE_QUOTE = '\'';
static const char DOUBLE_QUOTE = '"';

// One predefined entity: "&<pattern>;" stands for the character 'value'.
// 'length' is the number of characters in 'pattern'.
struct Entity {
    const char* pattern;
    int         length;
    char        value;
};

// Table of the entities recognized when reading and emitted when writing.
static const int NUM_ENTITIES = 5;
static const Entity entities[NUM_ENTITIES] = {
    { "quot", 4, DOUBLE_QUOTE },
    { "amp",  3, '&' },
    { "apos", 4, SINGLE_QUOTE },
    { "lt",   2, '<' },
    { "gt",   2, '>' }
};
- const char* StrPair::GetStr()
- {
- if ( flags & NEEDS_FLUSH ) {
- *end = 0;
- flags ^= NEEDS_FLUSH;
- if ( flags ) {
- char* p = start;
- char* q = start;
- while( p < end ) {
- if ( (flags & NEEDS_NEWLINE_NORMALIZATION) && *p == CR ) {
- // CR-LF pair becomes LF
- // CR alone becomes LF
- // LF-CR becomes LF
- if ( *(p+1) == LF ) {
- p += 2;
- }
- else {
- ++p;
- }
- *q = LF;
- }
- else if ( (flags & NEEDS_NEWLINE_NORMALIZATION) && *p == LF ) {
- if ( *(p+1) == CR ) {
- p += 2;
- }
- else {
- ++p;
- }
- *q = LF;
- }
- else if ( (flags & NEEDS_ENTITY_PROCESSING) && *p == '&' ) {
- int i=0;
- for( i=0; i<NUM_ENTITIES; ++i ) {
- if ( strncmp( p+1, entities[i].pattern, entities[i].length ) == 0
- && *(p+entities[i].length+1) == ';' )
- {
- // Found an entity convert;
- *q = entities[i].value;
- ++q;
- p += entities[i].length + 2;
- break;
- }
- }
- if ( i == NUM_ENTITIES ) {
- // fixme: treat as error?
- ++p;
- ++q;
- }
- }
- else {
- *q = *p;
- ++p;
- ++q;
- }
- }
- *q = 0;
- }
- flags = 0;
- }
- return start;
- }
- // --------- XMLBase ----------- //
- // fixme: should take in the entity/newline flags as param
- char* XMLBase::ParseText( char* p, StrPair* pair, const char* endTag, int strFlags )
- {
- TIXMLASSERT( endTag && *endTag );
- char* start = p;
- char endChar = *endTag;
- int length = strlen( endTag );
- // Inner loop of text parsing.
- while ( *p ) {
- if ( *p == endChar && strncmp( p, endTag, length ) == 0 ) {
- pair->Set( start, p, strFlags );
- return p + length;
- }
- ++p;
- }
- return p;
- }
- char* XMLBase::ParseName( char* p, StrPair* pair )
- {
- char* start = p;
- start = p;
- if ( !start || !(*start) ) {
- return 0;
- }
- if ( !IsAlpha( *p ) ) {
- return 0;
- }
- while( *p && (
- IsAlphaNum( (unsigned char) *p )
- || *p == '_'
- || *p == '-'
- || *p == '.'
- || *p == ':' ))
- {
- ++p;
- }
- if ( p > start ) {
- pair->Set( start, p, 0 );
- return p;
- }
- return 0;
- }
- char* XMLBase::Identify( XMLDocument* document, char* p, XMLNode** node )
- {
- XMLNode* returnNode = 0;
- char* start = p;
- p = XMLNode::SkipWhiteSpace( p );
- if( !p || !*p )
- {
- return 0;
- }
- // What is this thing?
- // - Elements start with a letter or underscore, but xml is reserved.
- // - Comments: <!--
- // - Decleration: <?xml
- // - Everthing else is unknown to tinyxml.
- //
- static const char* xmlHeader = { "<?xml" };
- static const char* commentHeader = { "<!--" };
- static const char* dtdHeader = { "<!" };
- static const char* cdataHeader = { "<![CDATA[" };
- static const char* elementHeader = { "<" }; // and a header for everything else; check last.
- static const int xmlHeaderLen = 5;
- static const int commentHeaderLen = 4;
- static const int dtdHeaderLen = 2;
- static const int cdataHeaderLen = 9;
- static const int elementHeaderLen = 1;
- if ( StringEqual( p, commentHeader, commentHeaderLen ) ) {
- returnNode = new XMLComment( document );
- p += commentHeaderLen;
- }
- else if ( StringEqual( p, elementHeader, elementHeaderLen ) ) {
- returnNode = new XMLElement( document );
- p += elementHeaderLen;
- }
- // fixme: better text detection
- else if ( (*p != '<') && IsAlphaNum( *p ) ) {
- // fixme: this is filtering out empty text...should it?
- returnNode = new XMLText( document );
- p = start; // Back it up, all the text counts.
- }
- else {
- TIXMLASSERT( 0 );
- }
- *node = returnNode;
- return p;
- }
- // --------- XMLNode ----------- //
- XMLNode::XMLNode( XMLDocument* doc ) :
- document( doc ),
- parent( 0 ),
- isTextParent( false ),
- firstChild( 0 ), lastChild( 0 ),
- prev( 0 ), next( 0 )
- {
- }
- XMLNode::~XMLNode()
- {
- ClearChildren();
- if ( parent ) {
- parent->Unlink( this );
- }
- }
- void XMLNode::ClearChildren()
- {
- while( firstChild ) {
- XMLNode* node = firstChild;
- Unlink( node );
- delete node;
- }
- firstChild = lastChild = 0;
- }
- void XMLNode::Unlink( XMLNode* child )
- {
- TIXMLASSERT( child->parent == this );
- if ( child == firstChild )
- firstChild = firstChild->next;
- if ( child == lastChild )
- lastChild = lastChild->prev;
- if ( child->prev ) {
- child->prev->next = child->next;
- }
- if ( child->next ) {
- child->next->prev = child->prev;
- }
- child->parent = 0;
- }
- XMLNode* XMLNode::InsertEndChild( XMLNode* addThis )
- {
- if ( lastChild ) {
- TIXMLASSERT( firstChild );
- TIXMLASSERT( lastChild->next == 0 );
- lastChild->next = addThis;
- addThis->prev = lastChild;
- lastChild = addThis;
- addThis->parent = this;
- addThis->next = 0;
- }
- else {
- TIXMLASSERT( firstChild == 0 );
- firstChild = lastChild = addThis;
- addThis->parent = this;
- addThis->prev = 0;
- addThis->next = 0;
- }
- if ( addThis->ToText() ) {
- SetTextParent();
- }
- return addThis;
- }
- void XMLNode::Print( XMLStreamer* streamer )
- {
- for( XMLNode* node = firstChild; node; node=node->next ) {
- node->Print( streamer );
- }
- }
- char* XMLNode::ParseDeep( char* p )
- {
- while( p && *p ) {
- XMLNode* node = 0;
- p = Identify( document, p, &node );
- if ( p && node ) {
- p = node->ParseDeep( p );
- // FIXME: is it the correct closing element?
- if ( node->IsClosingElement() ) {
- delete node;
- return p;
- }
- this->InsertEndChild( node );
- }
- }
- return 0;
- }
- // --------- XMLText ---------- //
- char* XMLText::ParseDeep( char* p )
- {
- p = ParseText( p, &value, "<", StrPair::TEXT_ELEMENT );
- // consumes the end tag.
- if ( p && *p ) {
- return p-1;
- }
- return 0;
- }
- void XMLText::Print( XMLStreamer* streamer )
- {
- const char* v = value.GetStr();
- streamer->PushText( v );
- }
- // --------- XMLComment ---------- //
- XMLComment::XMLComment( XMLDocument* doc ) : XMLNode( doc )
- {
- }
- XMLComment::~XMLComment()
- {
- //printf( "~XMLComment\n" );
- }
- void XMLComment::Print( XMLStreamer* streamer )
- {
- // XMLNode::Print( fp, depth );
- // fprintf( fp, "<!--%s-->\n", value.GetStr() );
- streamer->PushComment( value.GetStr() );
- }
- char* XMLComment::ParseDeep( char* p )
- {
- // Comment parses as text.
- return ParseText( p, &value, "-->", StrPair::COMMENT );
- }
- // --------- XMLAttribute ---------- //
- char* XMLAttribute::ParseDeep( char* p )
- {
- p = ParseText( p, &name, "=", StrPair::ATTRIBUTE_NAME );
- if ( !p || !*p ) return 0;
- char endTag[2] = { *p, 0 };
- ++p;
- p = ParseText( p, &value, endTag, StrPair::ATTRIBUTE_VALUE );
- if ( value.Empty() ) return 0;
- return p;
- }
- void XMLAttribute::Print( XMLStreamer* streamer )
- {
- // fixme: sort out single vs. double quote
- //fprintf( cfile, "%s=\"%s\"", name.GetStr(), value.GetStr() );
- streamer->PushAttribute( name.GetStr(), value.GetStr() );
- }
- // --------- XMLElement ---------- //
- XMLElement::XMLElement( XMLDocument* doc ) : XMLNode( doc ),
- closing( false ),
- rootAttribute( 0 ),
- lastAttribute( 0 )
- {
- }
- XMLElement::~XMLElement()
- {
- //printf( "~XMLElemen %x\n",this );
- XMLAttribute* attribute = rootAttribute;
- while( attribute ) {
- XMLAttribute* next = attribute->next;
- delete attribute;
- attribute = next;
- }
- }
- char* XMLElement::ParseAttributes( char* p, bool* closedElement )
- {
- const char* start = p;
- *closedElement = false;
- // Read the attributes.
- while( p ) {
- p = SkipWhiteSpace( p );
- if ( !p || !(*p) ) {
- document->SetError( XMLDocument::ERROR_PARSING_ELEMENT, start, name.GetStr() );
- return 0;
- }
- // attribute.
- if ( IsAlpha( *p ) ) {
- XMLAttribute* attrib = new XMLAttribute( this );
- p = attrib->ParseDeep( p );
- if ( !p ) {
- delete attrib;
- document->SetError( XMLDocument::ERROR_PARSING_ATTRIBUTE, start, p );
- return 0;
- }
- if ( rootAttribute ) {
- TIXMLASSERT( lastAttribute );
- lastAttribute->next = attrib;
- lastAttribute = attrib;
- }
- else {
- rootAttribute = lastAttribute = attrib;
- }
- }
- // end of the tag
- else if ( *p == '/' && *(p+1) == '>' ) {
- if ( closing ) {
- document->SetError( XMLDocument::ERROR_PARSING_ELEMENT, start, p );
- return 0;
- }
- *closedElement = true;
- return p+2; // done; sealed element.
- }
- // end of the tag
- else if ( *p == '>' ) {
- ++p;
- break;
- }
- else {
- document->SetError( XMLDocument::ERROR_PARSING_ELEMENT, start, p );
- return 0;
- }
- }
- return p;
- }
- //
- // <ele></ele>
- // <ele>foo<b>bar</b></ele>
- //
- char* XMLElement::ParseDeep( char* p )
- {
- // Read the element name.
- p = SkipWhiteSpace( p );
- if ( !p ) return 0;
- const char* start = p;
- // The closing element is the </element> form. It is
- // parsed just like a regular element then deleted from
- // the DOM.
- if ( *p == '/' ) {
- closing = true;
- ++p;
- }
- p = ParseName( p, &name );
- if ( name.Empty() ) return 0;
- bool elementClosed=false;
- p = ParseAttributes( p, &elementClosed );
- if ( !p || !*p || elementClosed || closing )
- return p;
- p = XMLNode::ParseDeep( p );
- return p;
- }
- void XMLElement::Print( XMLStreamer* streamer )
- {
- //if ( !parent || !parent->IsTextParent() ) {
- // PrintSpace( cfile, depth );
- //}
- //fprintf( cfile, "<%s", Name() );
- streamer->OpenElement( Name(), IsTextParent() );
- for( XMLAttribute* attrib=rootAttribute; attrib; attrib=attrib->next ) {
- //fprintf( cfile, " " );
- attrib->Print( streamer );
- }
- for( XMLNode* node=firstChild; node; node=node->next ) {
- node->Print( streamer );
- }
- streamer->CloseElement();
- }
- // --------- XMLDocument ----------- //
- XMLDocument::XMLDocument() :
- XMLNode( 0 ),
- charBuffer( 0 )
- {
- document = this; // avoid warning about 'this' in initializer list
- }
- XMLDocument::~XMLDocument()
- {
- delete [] charBuffer;
- }
- void XMLDocument::InitDocument()
- {
- errorID = NO_ERROR;
- errorStr1 = 0;
- errorStr2 = 0;
- delete [] charBuffer;
- charBuffer = 0;
- }
- int XMLDocument::Parse( const char* p )
- {
- ClearChildren();
- InitDocument();
- if ( !p || !*p ) {
- return true; // correctly parse an empty string?
- }
- size_t len = strlen( p );
- charBuffer = new char[ len+1 ];
- memcpy( charBuffer, p, len+1 );
- XMLNode* node = 0;
-
- char* q = ParseDeep( charBuffer );
- return errorID;
- }
- void XMLDocument::Print( XMLStreamer* streamer )
- {
- XMLStreamer stdStreamer( stdout );
- if ( !streamer )
- streamer = &stdStreamer;
- for( XMLNode* node = firstChild; node; node=node->next ) {
- node->Print( streamer );
- }
- }
- void XMLDocument::SetError( int error, const char* str1, const char* str2 )
- {
- errorID = error;
- printf( "ERROR: id=%d '%s' '%s'\n", error, str1, str2 ); // fixme: remove
- errorStr1 = str1;
- errorStr2 = str2;
- }
- StringStack::StringStack()
- {
- *pool = 0;
- mem = pool;
- inUse = 1; // always has a null
- allocated = INIT;
- nPositive = 0;
- }
- StringStack::~StringStack()
- {
- if ( mem != pool ) {
- delete [] mem;
- }
- }
- void StringStack::Push( const char* str ) {
- int needed = strlen( str ) + 1;
- if ( needed > 1 )
- nPositive++;
- if ( inUse+needed >= allocated ) {
- // fixme: power of 2
- // less stupid allocation
- int more = inUse+needed + 1000;
- char* newMem = new char[more];
- memcpy( newMem, mem, inUse );
- if ( mem != pool ) {
- delete [] mem;
- }
- mem = newMem;
- }
- strcpy( mem+inUse, str );
- inUse += needed;
- }
- const char* StringStack::Pop() {
- TIXMLASSERT( inUse > 1 );
- const char* p = mem+inUse-2;
- if ( *p ) {
- nPositive--;
- }
- while( *p ) { // stack starts with a null, don't need to check for 'mem'
- TIXMLASSERT( p > mem );
- --p;
- }
- inUse = p-mem+1;
- return p+1;
- }
- StringPtrStack::StringPtrStack()
- {
- *pool = 0;
- mem = pool;
- inUse = 0;
- allocated = INIT;
- nPositive = 0;
- }
- StringPtrStack::~StringPtrStack()
- {
- if ( mem != pool ) {
- delete [] mem;
- }
- }
- void StringPtrStack::Push( const char* str ) {
- int needed = inUse + 1;
- if ( str )
- nPositive++;
- if ( inUse+needed >= allocated ) {
- // fixme: power of 2
- // less stupid allocation
- int more = inUse+needed + 1000;
- char** newMem = new char*[more];
- memcpy( newMem, mem, inUse*sizeof(char*) );
- if ( mem != pool ) {
- delete [] mem;
- }
- mem = newMem;
- }
- mem[inUse] = (char*)str;
- inUse++;
- }
- const char* StringPtrStack::Pop() {
- TIXMLASSERT( inUse > 0 );
- inUse--;
- const char* result = mem[inUse];
- if ( result )
- nPositive--;
- return result;
- }
- XMLStreamer::XMLStreamer( FILE* file ) : fp( file ), depth( 0 ), elementJustOpened( false )
- {
- for( int i=0; i<ENTITY_RANGE; ++i ) {
- entityFlag[i] = false;
- }
- for( int i=0; i<NUM_ENTITIES; ++i ) {
- TIXMLASSERT( entities[i].value < ENTITY_RANGE );
- if ( entities[i].value < ENTITY_RANGE ) {
- entityFlag[ entities[i].value ] = true;
- }
- }
- }
- void XMLStreamer::PrintSpace( int depth )
- {
- for( int i=0; i<depth; ++i ) {
- fprintf( fp, " " );
- }
- }
- void XMLStreamer::PrintString( const char* p )
- {
- // Look for runs of bytes between entities to print.
- const char* q = p;
- while ( *q ) {
- if ( *q < ENTITY_RANGE ) {
- // Check for entities. If one is found, flush
- // the stream up until the entity, write the
- // entity, and keep looking.
- if ( entityFlag[*q] ) {
- while ( p < q ) {
- fputc( *p, fp );
- ++p;
- }
- for( int i=0; i<NUM_ENTITIES; ++i ) {
- if ( entities[i].value == *q ) {
- fprintf( fp, "&%s;", entities[i].pattern );
- break;
- }
- }
- ++p;
- }
- }
- ++q;
- }
- // Flush the remaining string. This will be the entire
- // string if an entity wasn't found.
- if ( q-p > 0 ) {
- fprintf( fp, "%s", p );
- }
- }
- void XMLStreamer::OpenElement( const char* name, bool textParent )
- {
- if ( elementJustOpened ) {
- SealElement();
- }
- if ( text.NumPositive() == 0 ) {
- PrintSpace( depth );
- }
- stack.Push( name );
- text.Push( textParent ? "T" : "" );
- // fixme: can names have entities?
- fprintf( fp, "<%s", name );
- elementJustOpened = true;
- ++depth;
- }
- void XMLStreamer::PushAttribute( const char* name, const char* value )
- {
- TIXMLASSERT( elementJustOpened );
- fprintf( fp, " %s=\"", name );
- PrintString( value );
- fprintf( fp, "\"" );
- }
- void XMLStreamer::CloseElement()
- {
- --depth;
- const char* name = stack.Pop();
- int wasPositive = text.NumPositive();
- text.Pop();
- if ( elementJustOpened ) {
- fprintf( fp, "/>" );
- if ( text.NumPositive() == 0 ) {
- fprintf( fp, "\n" );
- }
- }
- else {
- if ( wasPositive == 0 ) {
- PrintSpace( depth );
- }
- // fixme can names have entities?
- fprintf( fp, "</%s>", name );
- if ( text.NumPositive() == 0 ) {
- fprintf( fp, "\n" );
- }
- }
- elementJustOpened = false;
- }
- void XMLStreamer::SealElement()
- {
- elementJustOpened = false;
- fprintf( fp, ">" );
- if ( text.NumPositive() == 0 ) {
- fprintf( fp, "\n" );
- }
- }
- void XMLStreamer::PushText( const char* text )
- {
- if ( elementJustOpened ) {
- SealElement();
- }
- PrintString( text );
- }
- void XMLStreamer::PushComment( const char* comment )
- {
- if ( elementJustOpened ) {
- SealElement();
- }
- PrintSpace( depth );
- fprintf( fp, "<!--%s-->\n", comment );
- }
|