tinyxml2/tinyxml2.cpp

793 lines
16 KiB
C++

#include "tinyxml2.h"
#include <string.h>
#include <stdlib.h>
#include <stdio.h>
#include <ctype.h>
using namespace tinyxml2;
static const char LINE_FEED = (char)0x0a; // all line endings are normalized to LF
static const char LF = LINE_FEED;
static const char CARRIAGE_RETURN = (char)0x0d; // CR gets filtered out
static const char CR = CARRIAGE_RETURN;
static const char SINGLE_QUOTE = '\'';
static const char DOUBLE_QUOTE = '\"';
// Describes one predefined entity: the text that appears between '&' and ';'
// in the input, the length of that text, and the character it stands for.
struct Entity {
const char* pattern; // entity name, without the leading '&' and trailing ';'
int length; // number of characters in 'pattern'
char value; // the single character the entity represents
};
// Table of the entities understood when reading (StrPair::GetStr) and
// produced when writing (XMLStreamer::PrintString).
static const int NUM_ENTITIES = 5;
static const Entity entities[NUM_ENTITIES] =
{
{ "quot", 4, DOUBLE_QUOTE },
{ "amp", 3, '&' },
{ "apos", 4, SINGLE_QUOTE },
{ "lt", 2, '<' },
{ "gt", 2, '>' }
};
// Returns the string as a null-terminated C string, finalizing it lazily.
//
// While NEEDS_FLUSH is set, the byte at 'end' is overwritten with 0 and, if
// any other flag is set, the range [start, end) is rewritten in place:
//   - NEEDS_NEWLINE_NORMALIZATION: CR-LF, LF-CR, a lone CR and a lone LF
//     each become a single LF.
//   - NEEDS_ENTITY_PROCESSING: "&name;" sequences found in the entity table
//     are replaced by the character they stand for.
// The rewritten text is never longer than the input, so the write cursor
// never overtakes the read cursor. All flags are cleared afterwards, so
// subsequent calls simply return 'start'.
const char* StrPair::GetStr()
{
    if ( flags & NEEDS_FLUSH ) {
        *end = 0;
        flags ^= NEEDS_FLUSH;

        if ( flags ) {
            char* p = start;    // read cursor
            char* q = start;    // write cursor, always <= p

            while( p < end ) {
                if ( (flags & NEEDS_NEWLINE_NORMALIZATION) && *p == CR ) {
                    // CR-LF pair becomes LF; CR alone becomes LF.
                    // Looking at p[1] is safe: the buffer is terminated at 'end'.
                    if ( *(p+1) == LF ) {
                        p += 2;
                    }
                    else {
                        ++p;
                    }
                    // Advance the write cursor, otherwise the next character
                    // would overwrite the LF that was just stored.
                    *q = LF;
                    ++q;
                }
                else if ( (flags & NEEDS_NEWLINE_NORMALIZATION) && *p == LF ) {
                    // LF-CR pair becomes LF; LF alone stays LF.
                    if ( *(p+1) == CR ) {
                        p += 2;
                    }
                    else {
                        ++p;
                    }
                    *q = LF;
                    ++q;
                }
                else if ( (flags & NEEDS_ENTITY_PROCESSING) && *p == '&' ) {
                    int i=0;
                    for( i=0; i<NUM_ENTITIES; ++i ) {
                        if (    strncmp( p+1, entities[i].pattern, entities[i].length ) == 0
                             && *(p+entities[i].length+1) == ';' )
                        {
                            // Found an entity: emit its character and skip "&name;".
                            *q = entities[i].value;
                            ++q;
                            p += entities[i].length + 2;
                            break;
                        }
                    }
                    if ( i == NUM_ENTITIES ) {
                        // fixme: treat as error?
                        // Unknown entity: keep the '&' literally. It has to be
                        // copied, because q may already trail p after earlier
                        // replacements.
                        *q = *p;
                        ++p;
                        ++q;
                    }
                }
                else {
                    *q = *p;
                    ++p;
                    ++q;
                }
            }
            *q = 0;
        }
        flags = 0;
    }
    return start;
}
/*
const char* StringPool::Intern( const char* str )
{
// Treat the array as a linear, inplace hash table.
// Nothing can get deleted, so that's handy.
if ( size > pool.Size()*3/4 ) {
DynArray< const char*, 20 > store;
for( int i=0; i<pool.Size(); ++i ) {
if ( pool[i] != 0 ) {
store.Push( pool[i] );
}
}
int newSize = pool.Size() * 2;
pool.PopArr( pool.Size() );
const char** mem = pool.PushArr( newSize );
memset( (void*)mem, 0, sizeof(char)*newSize );
while ( !store.Empty() ) {
Intern( store.Pop() );
}
}
}
*/
// --------- XMLBase ----------- //
// fixme: should take in the entity/newline flags as param
// Scans forward from 'p' for the first occurrence of 'endTag'.
//
// When found, 'pair' is set to the text in front of the end tag (with
// 'strFlags') and the position just past the end tag is returned. When the
// input runs out first, 'pair' is left untouched and the returned pointer
// addresses the terminating null.
char* XMLBase::ParseText( char* p, StrPair* pair, const char* endTag, int strFlags )
{
    TIXMLASSERT( endTag && *endTag );

    char* const textBegin = p;
    const char  firstEndChar = *endTag;
    const int   endTagLen = strlen( endTag );

    for ( ; *p; ++p ) {
        // Cheap first-character test before the full comparison.
        if ( *p != firstEndChar ) {
            continue;
        }
        if ( strncmp( p, endTag, endTagLen ) == 0 ) {
            pair->Set( textBegin, p, strFlags );
            return p + endTagLen;
        }
    }
    return p;
}
// Reads a name starting at 'p'.
//
// The first character must satisfy IsAlpha(); the name then continues over
// characters that satisfy IsAlphaNum() or are one of '_', '-', '.', ':'.
// On success 'pair' is set to the name and the position just past it is
// returned. Returns 0 for a null or empty input, or when no name starts here.
char* XMLBase::ParseName( char* p, StrPair* pair )
{
    if ( !p || !(*p) ) {
        return 0;
    }
    char* const nameBegin = p;
    if ( !IsAlpha( *p ) ) {
        return 0;
    }

    for ( ;; ) {
        const char c = *p;
        if ( !c ) {
            break;
        }
        const bool partOfName =    IsAlphaNum( (unsigned char) c )
                                || c == '_'
                                || c == '-'
                                || c == '.'
                                || c == ':';
        if ( !partOfName ) {
            break;
        }
        ++p;
    }

    if ( p > nameBegin ) {
        pair->Set( nameBegin, p, 0 );
        return p;
    }
    return 0;
}
// Looks at the input at 'p' (after skipping white space), creates the node
// type that starts there, and stores it in '*node'.
//
//   - "<!--"          -> XMLComment; returns the position after the header.
//   - "<" otherwise   -> XMLElement; returns the position after the '<'.
//                        (Declarations, DTDs and CDATA are not recognized
//                        separately yet and end up here as well.)
//   - anything else   -> XMLText; returns the ORIGINAL 'p', because leading
//                        white space is part of the text.
//
// Returns 0, leaving '*node' untouched, when 'p' is null or only white space
// remains. White-space-only text therefore never produces a text node.
//
// Every non-markup start character is treated as text. Previously only
// alphanumeric starts were, and anything else (for example "&amp; more")
// returned the unchanged pointer with no node, so the caller never advanced.
char* XMLBase::Identify( XMLDocument* document, char* p, XMLNode** node )
{
    XMLNode* returnNode = 0;
    char* start = p;
    p = XMLNode::SkipWhiteSpace( p );
    if( !p || !*p )
    {
        return 0;
    }

    static const char* commentHeader = { "<!--" };
    static const char* elementHeader = { "<" };    // header for all other markup; check last.

    static const int commentHeaderLen = 4;
    static const int elementHeaderLen = 1;

    if ( StringEqual( p, commentHeader, commentHeaderLen ) ) {
        returnNode = new XMLComment( document );
        p += commentHeaderLen;
    }
    else if ( StringEqual( p, elementHeader, elementHeaderLen ) ) {
        returnNode = new XMLElement( document );
        p += elementHeaderLen;
    }
    else {
        // Not markup, so it is character data.
        returnNode = new XMLText( document );
        p = start;    // Back it up, all the text counts.
    }

    *node = returnNode;
    return p;
}
// --------- XMLNode ----------- //
// Creates a detached node that belongs to 'doc': no parent, no siblings,
// no children, and not yet flagged as a text parent.
XMLNode::XMLNode( XMLDocument* doc )
    : document( doc ),
      parent( 0 ),
      isTextParent( false ),
      firstChild( 0 ),
      lastChild( 0 ),
      prev( 0 ),
      next( 0 )
{
}
// Deletes all children, then removes this node from its parent's child list
// if it still has a parent.
XMLNode::~XMLNode()
{
    ClearChildren();

    if ( parent != 0 ) {
        parent->Unlink( this );
    }
}
void XMLNode::ClearChildren()
{
while( firstChild ) {
XMLNode* node = firstChild;
Unlink( node );
delete node;
}
firstChild = lastChild = 0;
}
// Removes 'child' from this node's child list without deleting it.
//
// 'child' must currently be a child of this node (asserted). Afterwards the
// child is fully detached: parent, prev and next are all null, so no stale
// pointers into the old sibling list survive.
void XMLNode::Unlink( XMLNode* child )
{
    TIXMLASSERT( child->parent == this );

    // Fix up the ends of the list first.
    if ( child == firstChild ) {
        firstChild = firstChild->next;
    }
    if ( child == lastChild ) {
        lastChild = lastChild->prev;
    }

    // Bridge the neighbours over the removed node.
    if ( child->prev ) {
        child->prev->next = child->next;
    }
    if ( child->next ) {
        child->next->prev = child->prev;
    }

    child->parent = 0;
    child->prev = 0;
    child->next = 0;
}
// Appends 'addThis' as the last child of this node and returns it.
// If the new child reports itself as text (ToText()), SetTextParent() is
// called on this node.
XMLNode* XMLNode::InsertEndChild( XMLNode* addThis )
{
    if ( !lastChild ) {
        // Empty list: the new node is both first and last.
        TIXMLASSERT( firstChild == 0 );
        addThis->prev = 0;
        firstChild = addThis;
    }
    else {
        TIXMLASSERT( firstChild );
        TIXMLASSERT( lastChild->next == 0 );
        addThis->prev = lastChild;
        lastChild->next = addThis;
    }
    lastChild = addThis;
    addThis->next = 0;
    addThis->parent = this;

    if ( addThis->ToText() ) {
        SetTextParent();
    }
    return addThis;
}
// Returns the first direct child that is an element and, when 'value' is
// non-null, whose name equals 'value'. Returns 0 if there is none.
XMLElement* XMLNode::FirstChildElement( const char* value )
{
    XMLNode* cursor = firstChild;
    while ( cursor ) {
        XMLElement* asElement = cursor->ToElement();
        if ( asElement && ( !value || StringEqual( asElement->Name(), value ) ) ) {
            return asElement;
        }
        cursor = cursor->next;
    }
    return 0;
}
// Prints each child, in order, to 'streamer'.
void XMLNode::Print( XMLStreamer* streamer )
{
    XMLNode* child = firstChild;
    while ( child ) {
        child->Print( streamer );
        child = child->next;
    }
}
// Parses the children of this node starting at 'p'.
//
// Nodes are identified and parsed one after another and appended as
// children. When a closing element is encountered it is discarded and the
// position after it is returned, which ends this node's content. Returns 0
// when the input is exhausted or nothing more can be identified.
char* XMLNode::ParseDeep( char* p )
{
    while( p && *p ) {
        XMLNode* node = 0;
        p = Identify( document, p, &node );
        if ( !p || !node ) {
            // Identify() made no progress. Stop here: retrying with the same
            // position would loop forever. Deleting a null node is a no-op.
            delete node;
            break;
        }

        p = node->ParseDeep( p );
        // FIXME: is it the correct closing element?
        if ( node->IsClosingElement() ) {
            delete node;
            return p;
        }
        this->InsertEndChild( node );
    }
    return 0;
}
// --------- XMLText ---------- //
// Reads text up to the next '<' into 'value'.
//
// ParseText() returns the position just past the '<'; this steps back one
// character so the caller sees the '<' again. Returns 0 when ParseText()
// yields a null pointer or a pointer to the terminating null.
char* XMLText::ParseDeep( char* p )
{
    char* afterText = ParseText( p, &value, "<", StrPair::TEXT_ELEMENT );
    if ( !afterText || !*afterText ) {
        return 0;
    }
    return afterText - 1;
}
// Sends this node's text to 'streamer'.
void XMLText::Print( XMLStreamer* streamer )
{
    streamer->PushText( value.GetStr() );
}
// --------- XMLComment ---------- //
// Creates an empty comment node belonging to 'doc'.
XMLComment::XMLComment( XMLDocument* doc )
    : XMLNode( doc )
{
}
// Nothing to release here; the XMLNode destructor does the cleanup.
XMLComment::~XMLComment()
{
}
// Sends the comment body to 'streamer'.
void XMLComment::Print( XMLStreamer* streamer )
{
    const char* body = value.GetStr();
    streamer->PushComment( body );
}
// Reads the comment body: everything up to the terminating "-->" is stored
// in 'value'. Returns whatever ParseText() returns.
char* XMLComment::ParseDeep( char* p )
{
    char* afterComment = ParseText( p, &value, "-->", StrPair::COMMENT );
    return afterComment;
}
// --------- XMLAttribute ---------- //
char* XMLAttribute::ParseDeep( char* p )
{
p = ParseText( p, &name, "=", StrPair::ATTRIBUTE_NAME );
if ( !p || !*p ) return 0;
char endTag[2] = { *p, 0 };
++p;
p = ParseText( p, &value, endTag, StrPair::ATTRIBUTE_VALUE );
if ( value.Empty() ) return 0;
return p;
}
// Sends this attribute's name and value to 'streamer'.
void XMLAttribute::Print( XMLStreamer* streamer )
{
    // fixme: sort out single vs. double quote
    const char* attribName = name.GetStr();
    const char* attribValue = value.GetStr();
    streamer->PushAttribute( attribName, attribValue );
}
// --------- XMLElement ---------- //
// Creates an element belonging to 'doc' that is not a closing element and
// has no attributes yet.
XMLElement::XMLElement( XMLDocument* doc )
    : XMLNode( doc ),
      closing( false ),
      rootAttribute( 0 ),
      lastAttribute( 0 )
{
}
// Deletes every attribute in the element's attribute list.
XMLElement::~XMLElement()
{
    for ( XMLAttribute* current = rootAttribute; current; ) {
        // Fetch the successor before the current attribute is destroyed.
        XMLAttribute* following = current->next;
        delete current;
        current = following;
    }
}
// Parses the attribute list of a tag, starting right after the element name.
//
// Attributes are appended to the element's attribute list in document order.
// '*closedElement' is set to true when the tag ends with "/>" and to false
// otherwise. Returns the position just past the end of the tag, or 0 after
// reporting an error to the document.
char* XMLElement::ParseAttributes( char* p, bool* closedElement )
{
    const char* start = p;
    *closedElement = false;

    // Read the attributes.
    while( p ) {
        p = SkipWhiteSpace( p );
        if ( !p || !(*p) ) {
            document->SetError( XMLDocument::ERROR_PARSING_ELEMENT, start, name.GetStr() );
            return 0;
        }

        // attribute.
        if ( IsAlpha( *p ) ) {
            // Remember where the attribute begins: after a failed parse 'p'
            // is null and must not be handed to SetError() as a string.
            const char* attribStart = p;

            XMLAttribute* attrib = new XMLAttribute( this );
            p = attrib->ParseDeep( p );
            if ( !p ) {
                delete attrib;
                document->SetError( XMLDocument::ERROR_PARSING_ATTRIBUTE, start, attribStart );
                return 0;
            }
            if ( rootAttribute ) {
                TIXMLASSERT( lastAttribute );
                lastAttribute->next = attrib;
                lastAttribute = attrib;
            }
            else {
                rootAttribute = lastAttribute = attrib;
            }
        }
        // end of the tag
        else if ( *p == '/' && *(p+1) == '>' ) {
            // A closing element (</name>) cannot also be self-closing.
            if ( closing ) {
                document->SetError( XMLDocument::ERROR_PARSING_ELEMENT, start, p );
                return 0;
            }
            *closedElement = true;
            return p+2;    // done; sealed element.
        }
        // end of the tag
        else if ( *p == '>' ) {
            ++p;
            break;
        }
        else {
            document->SetError( XMLDocument::ERROR_PARSING_ELEMENT, start, p );
            return 0;
        }
    }
    return p;
}
//
// <ele></ele>
// <ele>foo<b>bar</b></ele>
//
// Parses an element, starting right after the '<'.
//
// A leading '/' marks the closing form (</element>); it is parsed like a
// regular element and flagged through 'closing'. After the name and the
// attributes, the children are parsed unless the tag was self-closed, is a
// closing element, or the input ended.
char* XMLElement::ParseDeep( char* p )
{
    p = SkipWhiteSpace( p );
    if ( p == 0 ) {
        return 0;
    }

    if ( *p == '/' ) {
        closing = true;
        ++p;
    }

    // Read the element name.
    p = ParseName( p, &name );
    if ( name.Empty() ) {
        return 0;
    }

    bool selfClosed = false;
    p = ParseAttributes( p, &selfClosed );

    const bool hasContent = p && *p && !selfClosed && !closing;
    if ( !hasContent ) {
        return p;
    }
    return XMLNode::ParseDeep( p );
}
// Writes this element to 'streamer': opens the element, prints the
// attributes, prints the children, then closes the element.
void XMLElement::Print( XMLStreamer* streamer )
{
    streamer->OpenElement( Name(), IsTextParent() );

    XMLAttribute* attrib = rootAttribute;
    while ( attrib ) {
        attrib->Print( streamer );
        attrib = attrib->next;
    }

    XMLNode* child = firstChild;
    while ( child ) {
        child->Print( streamer );
        child = child->next;
    }

    streamer->CloseElement();
}
// --------- XMLDocument ----------- //
// Creates an empty document with no text buffer and no pending error.
XMLDocument::XMLDocument() :
    XMLNode( 0 ),
    charBuffer( 0 )
{
    document = this;    // avoid warning about 'this' in initializer list

    // Start in the same error-free state that InitDocument() establishes, so
    // the error members hold defined values before the first Parse().
    errorID = NO_ERROR;
    errorStr1 = 0;
    errorStr2 = 0;
}
// Frees the copy of the XML text made by Parse(), if any.
XMLDocument::~XMLDocument()
{
    delete[] charBuffer;
}
// Resets the document state: frees the text buffer and clears the error
// ID and both error strings.
void XMLDocument::InitDocument()
{
    delete[] charBuffer;
    charBuffer = 0;

    errorStr1 = 0;
    errorStr2 = 0;
    errorID = NO_ERROR;
}
// Allocates a new element that belongs to this document and gives it the
// name 'name'. The element is returned without being inserted anywhere.
XMLElement* XMLDocument::NewElement( const char* name )
{
    XMLElement* const created = new XMLElement( this );
    created->SetName( name );
    return created;
}
// Replaces the document's content by parsing the XML text in 'p'.
//
// Existing children and error state are discarded first. The text is copied
// into a private buffer and parsed from that copy. Returns the document's
// error ID after parsing.
// NOTE(review): for null or empty input this returns 'true' (1) rather than
// an error ID -- confirm what callers expect here.
int XMLDocument::Parse( const char* p )
{
    ClearChildren();
    InitDocument();

    const bool emptyInput = ( p == 0 ) || ( *p == 0 );
    if ( emptyInput ) {
        return true;    // correctly parse an empty string?
    }

    // Copy the text including its terminating null.
    const size_t bytes = strlen( p ) + 1;
    charBuffer = new char[ bytes ];
    memcpy( charBuffer, p, bytes );

    ParseDeep( charBuffer );
    return errorID;
}
// Prints all top-level nodes to 'streamer'. When 'streamer' is null, a
// streamer that writes to stdout is used instead.
void XMLDocument::Print( XMLStreamer* streamer )
{
    XMLStreamer stdStreamer( stdout );
    XMLStreamer* const out = streamer ? streamer : &stdStreamer;

    XMLNode* child = firstChild;
    while ( child ) {
        child->Print( out );
        child = child->next;
    }
}
// Records an error on the document: the error ID plus two context strings.
// The pointers are stored as given (not copied); either may be null.
void XMLDocument::SetError( int error, const char* str1, const char* str2 )
{
    errorID = error;
    // Passing a null pointer for "%s" is undefined behavior, so print an
    // empty string in that case.
    printf( "ERROR: id=%d '%s' '%s'\n", error, str1 ? str1 : "", str2 ? str2 : "" );    // fixme: remove
    errorStr1 = str1;
    errorStr2 = str2;
}
/*
StringStack::StringStack()
{
nPositive = 0;
mem.Push( 0 ); // start with null. makes later code simpler.
}
StringStack::~StringStack()
{
}
void StringStack::Push( const char* str ) {
int needed = strlen( str ) + 1;
char* p = mem.PushArr( needed );
strcpy( p, str );
if ( needed > 1 )
nPositive++;
}
const char* StringStack::Pop() {
TIXMLASSERT( mem.Size() > 1 );
const char* p = mem.Mem() + mem.Size() - 2; // end of final string.
if ( *p ) {
nPositive--;
}
while( *p ) { // stack starts with a null, don't need to check for 'mem'
TIXMLASSERT( p > mem.Mem() );
--p;
}
mem.PopArr( strlen(p)+1 );
return p+1;
}
*/
// Creates a streamer that writes to 'file' and builds the entity lookup
// table: entityFlag[c] is true exactly for the characters that appear as a
// value in the entity table.
XMLStreamer::XMLStreamer( FILE* file ) : fp( file ), depth( 0 ), elementJustOpened( false )
{
    int slot = 0;
    while ( slot < ENTITY_RANGE ) {
        entityFlag[slot] = false;
        ++slot;
    }

    for ( const Entity* entity = entities; entity != entities + NUM_ENTITIES; ++entity ) {
        TIXMLASSERT( entity->value < ENTITY_RANGE );
        if ( entity->value < ENTITY_RANGE ) {
            entityFlag[ entity->value ] = true;
        }
    }
}
// Writes one indentation unit per level of 'depth' to the output file.
void XMLStreamer::PrintSpace( int depth )
{
    int remaining = depth;
    while ( remaining > 0 ) {
        fprintf( fp, " " );
        --remaining;
    }
}
// Writes the string 'p' to the output file, replacing every character that
// has an entity (per the entity table) with its "&name;" form.
//
// 'p' marks the start of the not-yet-written run and 'q' is the scan
// position. When an entity character is found, the run in front of it is
// flushed, the entity is written, and the run restarts after it.
void XMLStreamer::PrintString( const char* p )
{
    // Look for runs of bytes between entities to print.
    const char* q = p;
    while ( *q ) {
        // Index the flag table with the unsigned byte value. A plain 'char'
        // may be signed, and bytes >= 0x80 (e.g. UTF-8) would then be
        // negative, pass the range check, and index out of bounds.
        const unsigned char c = (unsigned char) *q;
        if ( c < ENTITY_RANGE && entityFlag[c] ) {
            // Flush the stream up until the entity, write the entity, and
            // keep looking.
            while ( p < q ) {
                fputc( *p, fp );
                ++p;
            }
            for( int i=0; i<NUM_ENTITIES; ++i ) {
                if ( entities[i].value == *q ) {
                    fprintf( fp, "&%s;", entities[i].pattern );
                    break;
                }
            }
            ++p;    // skip the character that was replaced by the entity
        }
        ++q;
    }
    // Flush the remaining string. This will be the entire
    // string if an entity wasn't found.
    if ( q-p > 0 ) {
        fprintf( fp, "%s", p );
    }
}
// Starts a new element named 'name'.
//
// A still-open start tag of the enclosing element is sealed first. The
// indentation is written unless TextOnStack() reports true. The name and the
// text-parent marker ('T' or 'e') are pushed, "<name" is written, and the
// tag is left open so that attributes can follow.
void XMLStreamer::OpenElement( const char* name, bool textParent )
{
    if ( elementJustOpened ) {
        SealElement();
    }

    const bool indent = !TextOnStack();
    if ( indent ) {
        PrintSpace( depth );
    }

    stack.Push( name );
    const char marker = textParent ? 'T' : 'e';
    text.Push( marker );

    // fixme: can names have entities?
    fprintf( fp, "<%s", name );
    elementJustOpened = true;
    ++depth;
}
// Writes  name="value"  into the currently open start tag. The value goes
// through PrintString(), so entity characters in it are escaped. Must be
// called while a start tag is still open (asserted).
void XMLStreamer::PushAttribute( const char* name, const char* value )
{
    TIXMLASSERT( elementJustOpened );

    fprintf( fp, " %s=\"", name );    // leading space, name, opening quote
    PrintString( value );
    fprintf( fp, "\"" );              // closing quote
}
// Ends the most recently opened element.
//
// If the start tag is still open, the element has no content and is written
// in the short "/>" form; otherwise a full "</name>" end tag is written.
// TextOnStack() is sampled both before and after this element's marker is
// popped, and those two results decide whether indentation and the trailing
// newline are written.
void XMLStreamer::CloseElement()
{
    --depth;
    const char* name = stack.Pop();
    const bool textBeforePop = TextOnStack();
    text.Pop();

    if ( !elementJustOpened ) {
        if ( !textBeforePop ) {
            PrintSpace( depth );
        }
        // fixme can names have entities?
        fprintf( fp, "</%s>", name );
        if ( !TextOnStack() ) {
            fprintf( fp, "\n" );
        }
    }
    else {
        fprintf( fp, "/>" );
        if ( !textBeforePop ) {
            fprintf( fp, "\n" );
        }
    }
    elementJustOpened = false;
}
// Finishes an open start tag by writing ">", followed by a newline unless
// TextOnStack() reports true.
void XMLStreamer::SealElement()
{
    elementJustOpened = false;
    fprintf( fp, ">" );

    const bool newlineWanted = !TextOnStack();
    if ( newlineWanted ) {
        fprintf( fp, "\n" );
    }
}
// Writes character data. A still-open start tag is sealed first; the text
// is then written through PrintString(), which escapes entity characters.
void XMLStreamer::PushText( const char* text )
{
    const bool tagStillOpen = elementJustOpened;
    if ( tagStillOpen ) {
        SealElement();
    }
    PrintString( text );
}
// Writes a comment on its own indented line. A still-open start tag is
// sealed first. The comment body is written verbatim, without escaping.
void XMLStreamer::PushComment( const char* comment )
{
    const bool tagStillOpen = elementJustOpened;
    if ( tagStillOpen ) {
        SealElement();
    }

    PrintSpace( depth );
    fprintf( fp, "<!--%s-->\n", comment );
}