tinyxml2/tinyxml2.cpp

714 lines
14 KiB
C++
Raw Normal View History

2011-12-28 19:42:49 -08:00
#include "tinyxml2.h"
#include <string.h>
#include <stdlib.h>
#include <stdio.h>
2011-12-31 14:58:18 -08:00
#include <ctype.h>
2011-12-28 19:42:49 -08:00
using namespace tinyxml2;
// Character constants shared by the parser.
// Line feed: every line ending is normalized to this character.
static const char LINE_FEED       = static_cast<char>( 0x0a );
static const char LF              = LINE_FEED;
// Carriage return: filtered out during normalization.
static const char CARRIAGE_RETURN = static_cast<char>( 0x0d );
static const char CR              = CARRIAGE_RETURN;
// Quote characters.
static const char SINGLE_QUOTE    = '\'';
static const char DOUBLE_QUOTE    = '\"';
2012-01-14 18:08:12 -08:00
2012-01-25 17:44:30 -08:00
// Describes one entity: the text that appears between '&' and ';', the
// number of characters in that text, and the character it stands for.
struct Entity {
    const char* pattern;
    int         length;
    char        value;
};

// Table of the entities recognized when reading and flagged when writing.
static const int NUM_ENTITIES = 5;
static const Entity entities[NUM_ENTITIES] = {
    { "quot", 4, '\"' },
    { "amp",  3, '&'  },
    { "apos", 4, '\'' },
    { "lt",   2, '<'  },
    { "gt",   2, '>'  }
};
2012-01-14 18:08:12 -08:00
// --------- CharBuffer ----------- //
2011-12-28 19:42:49 -08:00
// Allocates a CharBuffer holding a private, null-terminated copy of 'in'.
//
// in:      null-terminated text to copy.
// returns: the new buffer, or 0 when 'in' is null or the allocation fails.
/*static*/ CharBuffer* CharBuffer::Construct( const char* in )
{
    if ( !in ) {
        return 0;
    }
    const size_t len = strlen( in );
    // Header and text live in one allocation. This assumes sizeof( CharBuffer )
    // already leaves room for the terminating null (i.e. 'mem' is declared
    // with at least one element) -- TODO confirm against the header.
    const size_t size = len + sizeof( CharBuffer );
    CharBuffer* cb = static_cast<CharBuffer*>( malloc( size ) );
    if ( !cb ) {
        return 0;
    }
    cb->length = len;
    memcpy( cb->mem, in, len + 1 );   // +1 copies the terminating null as well
    return cb;
}
// Hands the buffer's storage back to the C allocator.
/*static*/ void CharBuffer::Free( CharBuffer* cb )
{
    ::free( static_cast<void*>( cb ) );
}
const char* StrPair::GetStr()
{
if ( flags & NEEDS_FLUSH ) {
*end = 0;
2012-01-25 17:44:30 -08:00
flags ^= NEEDS_FLUSH;
2012-01-25 17:44:30 -08:00
if ( flags ) {
char* p = start;
char* q = start;
while( p < end ) {
2012-01-25 17:44:30 -08:00
if ( (flags & NEEDS_NEWLINE_NORMALIZATION) && *p == CR ) {
// CR-LF pair becomes LF
// CR alone becomes LF
// LF-CR becomes LF
if ( *(p+1) == LF ) {
p += 2;
}
else {
++p;
}
*q = LF;
}
2012-01-25 17:44:30 -08:00
else if ( (flags & NEEDS_NEWLINE_NORMALIZATION) && *p == LF ) {
if ( *(p+1) == CR ) {
p += 2;
}
else {
++p;
}
*q = LF;
}
2012-01-25 17:44:30 -08:00
else if ( (flags & NEEDS_ENTITY_PROCESSING) && *p == '&' ) {
int i=0;
for( i=0; i<NUM_ENTITIES; ++i ) {
if ( strncmp( p+1, entities[i].pattern, entities[i].length ) == 0
&& *(p+entities[i].length+1) == ';' )
{
// Found an entity convert;
*q = entities[i].value;
++q;
p += entities[i].length + 2;
break;
}
}
if ( i == NUM_ENTITIES ) {
// fixme: treat as error?
++p;
++q;
}
}
else {
*q = *p;
++p;
2012-01-23 11:42:06 -08:00
++q;
}
}
2012-01-25 17:44:30 -08:00
*q = 0;
}
flags = 0;
}
return start;
}
2012-01-18 17:43:40 -08:00
// --------- XMLBase ----------- //
char* XMLBase::ParseText( char* p, StrPair* pair, const char* endTag )
2012-01-18 17:43:40 -08:00
{
TIXMLASSERT( endTag && *endTag );
char* start = p;
char endChar = *endTag;
int length = strlen( endTag );
// Inner loop of text parsing.
while ( *p ) {
if ( *p == endChar && strncmp( p, endTag, length ) == 0 ) {
pair->Set( start, p, StrPair::NEEDS_ENTITY_PROCESSING | StrPair::NEEDS_NEWLINE_NORMALIZATION );
2012-01-23 11:42:06 -08:00
return p + length;
2012-01-18 17:43:40 -08:00
}
2012-01-23 11:42:06 -08:00
++p;
2012-01-18 17:43:40 -08:00
}
return p;
2012-01-18 17:43:40 -08:00
}
2012-01-20 12:55:24 -08:00
char* XMLBase::ParseName( char* p, StrPair* pair )
2012-01-18 17:43:40 -08:00
{
char* start = p;
start = p;
if ( !start || !(*start) ) {
return 0;
}
if ( !IsAlpha( *p ) ) {
return 0;
}
while( *p && (
IsAlphaNum( (unsigned char) *p )
|| *p == '_'
|| *p == '-'
|| *p == '.'
|| *p == ':' ))
{
++p;
}
if ( p > start ) {
pair->Set( start, p, 0 );
return p;
2012-01-18 17:43:40 -08:00
}
2012-01-20 11:27:56 -08:00
return 0;
2012-01-18 17:43:40 -08:00
}
// Decides what kind of node begins at 'p' and creates it.
//
// document: passed to the constructor of the created node.
// p:        current parse position; leading white space is skipped.
// node:     receives the new node, or 0 when nothing was created.
// returns:  where the new node should continue parsing, or 0 when the input
//           is exhausted or does not start anything recognized. A non-null
//           return always comes with a non-null *node, so callers cannot
//           end up retrying the same position.
//
// What is recognized:
//   - Comments:  "<!--"  (position returned is just past the header)
//   - Elements:  "<"     (checked after the comment header)
//   - Text:      anything starting with an alphanumeric character; the
//                position returned is the ORIGINAL 'p', so leading white
//                space stays part of the text.
// Declarations ("<?xml"), DTDs ("<!") and CDATA ("<![CDATA[") have no
// dedicated handling yet; since they begin with '<' they presumably take
// the element branch.
char* XMLBase::Identify( XMLDocument* document, char* p, XMLNode** node )
{
    *node = 0;

    char* const start = p;
    p = XMLNode::SkipWhiteSpace( p );
    if ( !p || !*p ) {
        return 0;
    }

    static const char* commentHeader    = { "<!--" };
    static const char* elementHeader    = { "<" };    // header for everything else; check last.
    static const int   commentHeaderLen = 4;
    static const int   elementHeaderLen = 1;

    if ( StringEqual( p, commentHeader, commentHeaderLen ) ) {
        *node = new XMLComment( document );
        return p + commentHeaderLen;
    }
    if ( StringEqual( p, elementHeader, elementHeaderLen ) ) {
        *node = new XMLElement( document );
        return p + elementHeaderLen;
    }
    // fixme: better text detection
    if ( (*p != '<') && IsAlphaNum( *p ) ) {
        // fixme: this is filtering out empty text...should it?
        *node = new XMLText( document );
        return start;    // Back it up, all the text counts.
    }

    // Unrecognized input. Report "no progress possible" rather than handing
    // back a position without a node.
    TIXMLASSERT( 0 );
    return 0;
}
// --------- XMLNode ----------- //
// Creates a node associated with 'doc' that has no parent, no siblings and
// no children, and is not marked as a text parent.
XMLNode::XMLNode( XMLDocument* doc )
    : document( doc ),
      parent( 0 ),
      isTextParent( false ),
      firstChild( 0 ),
      lastChild( 0 ),
      prev( 0 ),
      next( 0 )
{
}
// Detaches and deletes every child, front to back.
XMLNode::~XMLNode()
{
    for ( XMLNode* child = firstChild; child; child = firstChild ) {
        Unlink( child );
        delete child;
    }
}
// Removes 'child' from this node's child list without deleting it.
//
// 'child' must currently be a child of this node. Afterwards the remaining
// siblings are linked to each other and 'child' has no parent and no
// siblings, so it never carries stale pointers into the list it left.
void XMLNode::Unlink( XMLNode* child )
{
    TIXMLASSERT( child->parent == this );

    if ( child == firstChild ) {
        firstChild = firstChild->next;
    }
    if ( child == lastChild ) {
        lastChild = lastChild->prev;
    }

    if ( child->prev ) {
        child->prev->next = child->next;
    }
    if ( child->next ) {
        child->next->prev = child->prev;
    }

    child->prev   = 0;
    child->next   = 0;
    child->parent = 0;
}
// Appends 'addThis' as the last child of this node and returns it.
// If the new child reports itself as text (ToText()), SetTextParent() is
// called on this node.
XMLNode* XMLNode::InsertEndChild( XMLNode* addThis )
{
    XMLNode* const previousTail = lastChild;

    if ( previousTail ) {
        TIXMLASSERT( firstChild );
        TIXMLASSERT( previousTail->next == 0 );
        previousTail->next = addThis;
    }
    else {
        // Empty list: the new node is the head as well as the tail.
        TIXMLASSERT( firstChild == 0 );
        firstChild = addThis;
    }

    addThis->prev   = previousTail;
    addThis->next   = 0;
    addThis->parent = this;
    lastChild       = addThis;

    if ( addThis->ToText() ) {
        SetTextParent();
    }
    return addThis;
}
2012-01-24 18:03:07 -08:00
// Prints each child, in order, to 'streamer'.
void XMLNode::Print( XMLStreamer* streamer )
{
    XMLNode* child = firstChild;
    while ( child ) {
        child->Print( streamer );
        child = child->next;
    }
}
2012-01-18 17:55:48 -08:00
// Parses the children of this node starting at 'p'.
//
// Each iteration identifies the next node, lets it parse itself, and appends
// it as a child. A node that reports IsClosingElement() ends this level: it
// is deleted and the position after it is returned. Returns 0 when the
// input ends or nothing further can be identified.
char* XMLNode::ParseDeep( char* p )
{
    while( p && *p ) {
        XMLNode* node = 0;
        p = Identify( document, p, &node );
        if ( !p || !node ) {
            // Nothing usable was identified. Stop here: looping again would
            // examine the very same position forever. 'delete' on a null
            // pointer is a no-op; a stray node is released.
            delete node;
            return 0;
        }

        p = node->ParseDeep( p );
        // FIXME: is it the correct closing element?
        if ( node->IsClosingElement() ) {
            delete node;
            return p;
        }
        this->InsertEndChild( node );
    }
    return 0;
}
2012-01-23 15:32:10 -08:00
// --------- XMLText ---------- //
// Reads text up to the next '<'.
// ParseText() consumes the '<', so the result is moved back by one to let
// the caller see it again. Returns 0 when no input remains afterwards.
char* XMLText::ParseDeep( char* p )
{
    char* const afterTag = ParseText( p, &value, "<" );
    const bool inputRemains = afterTag && *afterTag;
    if ( !inputRemains ) {
        return 0;
    }
    return afterTag - 1;
}
2012-01-24 18:03:07 -08:00
// Sends this node's text to 'streamer'.
void XMLText::Print( XMLStreamer* streamer )
{
    streamer->PushText( value.GetStr() );
}
// --------- XMLComment ---------- //
// Creates a comment node; all setup is done by the XMLNode constructor.
XMLComment::XMLComment( XMLDocument* doc )
    : XMLNode( doc )
{
}
2012-01-11 15:43:54 -08:00
// Nothing to release beyond what the base class handles.
XMLComment::~XMLComment()
{
}
2012-01-24 18:03:07 -08:00
// Sends the comment body to 'streamer'.
void XMLComment::Print( XMLStreamer* streamer )
{
    const char* body = value.GetStr();
    streamer->PushComment( body );
}
// A comment is parsed like text that ends at "-->".
char* XMLComment::ParseDeep( char* p )
{
    char* const afterComment = ParseText( p, &value, "-->" );
    return afterComment;
}
2012-01-18 17:43:40 -08:00
// --------- XMLAttribute ---------- //
char* XMLAttribute::ParseDeep( char* p )
{
2012-01-23 13:29:35 -08:00
p = ParseText( p, &name, "=" );
if ( !p || !*p ) return 0;
2012-01-18 17:43:40 -08:00
char endTag[2] = { *p, 0 };
++p;
p = ParseText( p, &value, endTag );
if ( value.Empty() ) return 0;
2012-01-18 17:43:40 -08:00
return p;
}
2012-01-24 18:03:07 -08:00
// Sends this attribute's name and value to 'streamer'.
void XMLAttribute::Print( XMLStreamer* streamer )
{
    // fixme: sort out single vs. double quote
    const char* attribName  = name.GetStr();
    const char* attribValue = value.GetStr();
    streamer->PushAttribute( attribName, attribValue );
}
2012-01-18 17:43:40 -08:00
// --------- XMLElement ---------- //
// Creates an element that is not a closing tag and has no attributes.
XMLElement::XMLElement( XMLDocument* doc )
    : XMLNode( doc ),
      closing( false ),
      rootAttribute( 0 ),
      lastAttribute( 0 )
{
}
// Deletes every attribute in the element's attribute list.
XMLElement::~XMLElement()
{
    for ( XMLAttribute* current = rootAttribute; current; ) {
        // Fetch the successor first; 'current' is gone after the delete.
        XMLAttribute* const following = current->next;
        delete current;
        current = following;
    }
}
char* XMLElement::ParseAttributes( char* p, bool* closedElement )
2012-01-18 17:43:40 -08:00
{
const char* start = p;
*closedElement = false;
2012-01-18 17:43:40 -08:00
// Read the attributes.
while( p ) {
p = SkipWhiteSpace( p );
if ( !p || !(*p) ) {
document->SetError( XMLDocument::ERROR_PARSING_ELEMENT, start, name.GetStr() );
2012-01-18 17:43:40 -08:00
return 0;
}
// attribute.
2012-01-23 13:29:35 -08:00
if ( IsAlpha( *p ) ) {
2012-01-18 17:43:40 -08:00
XMLAttribute* attrib = new XMLAttribute( this );
p = attrib->ParseDeep( p );
if ( !p ) {
delete attrib;
document->SetError( XMLDocument::ERROR_PARSING_ATTRIBUTE, start, p );
2012-01-18 17:43:40 -08:00
return 0;
}
if ( rootAttribute ) {
TIXMLASSERT( lastAttribute );
lastAttribute->next = attrib;
lastAttribute = attrib;
}
else {
rootAttribute = lastAttribute = attrib;
}
}
// end of the tag
2012-01-18 17:43:40 -08:00
else if ( *p == '/' && *(p+1) == '>' ) {
if ( closing ) {
document->SetError( XMLDocument::ERROR_PARSING_ELEMENT, start, p );
return 0;
}
*closedElement = true;
2012-01-18 17:43:40 -08:00
return p+2; // done; sealed element.
}
// end of the tag
2012-01-18 17:43:40 -08:00
else if ( *p == '>' ) {
++p;
break;
}
else {
document->SetError( XMLDocument::ERROR_PARSING_ELEMENT, start, p );
return 0;
}
2012-01-18 17:43:40 -08:00
}
return p;
}
2012-01-18 17:43:40 -08:00
//
// <ele></ele>
// <ele>foo<b>bar</b></ele>
//
// Parses an element: optional '/', name, attributes and, for an opening
// tag that is not self-closed, the child nodes.
char* XMLElement::ParseDeep( char* p )
{
    // Read the element name.
    p = SkipWhiteSpace( p );
    if ( !p ) {
        return 0;
    }

    // A leading '/' marks the </element> form. It is parsed like a regular
    // element and later removed from the DOM by the caller.
    if ( *p == '/' ) {
        closing = true;
        ++p;
    }

    p = ParseName( p, &name );
    if ( name.Empty() ) {
        return 0;
    }

    bool sealed = false;
    p = ParseAttributes( p, &sealed );

    // Children exist only for an opening tag with input left after it.
    const bool hasContent = p && *p && !sealed && !closing;
    if ( !hasContent ) {
        return p;
    }
    return XMLNode::ParseDeep( p );
}
2012-01-24 18:03:07 -08:00
// Streams the element: open tag, attributes, children, then close.
void XMLElement::Print( XMLStreamer* streamer )
{
    streamer->OpenElement( Name(), IsTextParent() );

    XMLAttribute* attrib = rootAttribute;
    while ( attrib ) {
        attrib->Print( streamer );
        attrib = attrib->next;
    }

    XMLNode* child = firstChild;
    while ( child ) {
        child->Print( streamer );
        child = child->next;
    }

    streamer->CloseElement();
}
// --------- XMLDocument ----------- //
// Creates an empty document: it is its own owning document and has no
// text buffer yet.
XMLDocument::XMLDocument()
    : XMLNode( this ),
      charBuffer( 0 )
{
}
2011-12-28 14:36:55 -08:00
// Releases the text buffer allocated by Parse().
//
// The child nodes are deleted afterwards by the XMLNode destructor.
// NOTE(review): this assumes node destructors do not read the parsed text
// (they only hold pointers into the buffer) -- confirm against the header.
XMLDocument::~XMLDocument()
{
    CharBuffer::Free( charBuffer );    // a null buffer is fine: free( 0 ) is a no-op
    charBuffer = 0;
}
bool XMLDocument::Parse( const char* p )
{
2012-01-11 15:43:54 -08:00
charBuffer = CharBuffer::Construct( p );
XMLNode* node = 0;
char* q = ParseDeep( charBuffer->mem );
return true;
}
2012-01-24 18:03:07 -08:00
// Prints every top-level node. When 'streamer' is null, output goes to a
// local streamer writing to stdout.
void XMLDocument::Print( XMLStreamer* streamer )
{
    XMLStreamer stdStreamer( stdout );
    XMLStreamer* const target = streamer ? streamer : &stdStreamer;

    XMLNode* child = firstChild;
    while ( child ) {
        child->Print( target );
        child = child->next;
    }
}
// Reports a parse error on stdout.
//
// error: error id.
// str1, str2: context strings; either may be null, in which case an empty
//             string is printed (passing null to "%s" is undefined).
void XMLDocument::SetError( int error, const char* str1, const char* str2 )
{
    const char* first  = str1 ? str1 : "";
    const char* second = str2 ? str2 : "";
    printf( "ERROR: id=%d '%s' '%s'\n", error, first, second );
}
2012-01-24 18:03:07 -08:00
// Starts with the built-in pool as storage. The storage always begins with
// a null byte, which is why one byte counts as used from the start.
StringStack::StringStack()
{
    mem       = pool;
    mem[0]    = 0;
    allocated = INIT;
    inUse     = 1;    // always has a null
    nPositive = 0;
}
// Frees the storage unless it is still the built-in pool.
StringStack::~StringStack()
{
    if ( mem == pool ) {
        return;
    }
    delete [] mem;
}
2012-01-24 18:03:07 -08:00
// Pushes a copy of 'str' (including its terminating null) onto the stack.
// Non-empty strings are counted in 'nPositive'.
void StringStack::Push( const char* str ) {
    const int needed = (int)strlen( str ) + 1;
    if ( needed > 1 )
        nPositive++;

    if ( inUse+needed > allocated ) {
        // fixme: power of 2
        // less stupid allocation
        const int more = inUse+needed + 1000;

        char* newMem = new char[more];
        memcpy( newMem, mem, inUse );
        if ( mem != pool ) {
            delete [] mem;
        }
        mem = newMem;
        // Record the new capacity; otherwise every later push would
        // reallocate and copy the whole stack again.
        allocated = more;
    }
    memcpy( mem+inUse, str, needed );
    inUse += needed;
}
// Removes the top string and returns a pointer to it. The pointer refers
// to the stack's own storage.
const char* StringStack::Pop() {
    TIXMLASSERT( inUse > 1 );

    // Last character of the top string, or the previous string's null when
    // the top string is empty.
    const char* cursor = mem+inUse-2;
    if ( *cursor != 0 ) {
        nPositive--;
    }
    // Walk back to the null in front of the top string. The stack starts
    // with a null, so there is no need to check for 'mem'.
    for ( ; *cursor; --cursor ) {
        TIXMLASSERT( cursor > mem );
    }
    inUse = cursor-mem+1;
    return cursor+1;
}
// Creates a streamer writing to 'file' and builds the table that flags
// which characters have an entry in 'entities'.
XMLStreamer::XMLStreamer( FILE* file )
    : fp( file ),
      depth( 0 ),
      elementJustOpened( false )
{
    int slot = 0;
    while ( slot < ENTITY_RANGE ) {
        entityFlag[slot] = false;
        ++slot;
    }

    for ( const Entity* entity = entities; entity != entities + NUM_ENTITIES; ++entity ) {
        TIXMLASSERT( entity->value < ENTITY_RANGE );
        if ( entity->value < ENTITY_RANGE ) {
            entityFlag[ entity->value ] = true;
        }
    }
}
// Writes one indentation unit per level of 'depth'.
void XMLStreamer::PrintSpace( int depth )
{
    for ( int remaining = depth; remaining > 0; --remaining ) {
        fprintf( fp, " " );
    }
}
2012-01-25 17:50:25 -08:00
// Placeholder: currently ignores its argument and writes nothing.
void XMLStreamer::PrintString( const char* /*unused*/ )
{
}
2012-01-24 18:03:07 -08:00
void XMLStreamer::OpenElement( const char* name, bool textParent )
{
if ( elementJustOpened ) {
SealElement();
}
if ( text.NumPositive() == 0 ) {
PrintSpace( depth );
}
2012-01-24 18:03:07 -08:00
stack.Push( name );
text.Push( textParent ? "T" : "" );
fprintf( fp, "<%s", name );
elementJustOpened = true;
++depth;
}
// Writes one attribute inside the tag that is currently open.
// Must be called before the open tag has been sealed.
void XMLStreamer::PushAttribute( const char* name, const char* value )
{
    TIXMLASSERT( elementJustOpened );
    fprintf( fp, " %s=\"%s\"", name, value );
}
// Closes the innermost open element: "/>" when nothing was written since
// it was opened, "</name>" otherwise. A newline follows unless a non-empty
// entry remains on the 'text' stack.
void XMLStreamer::CloseElement()
{
    --depth;
    const char* name = stack.Pop();
    // Sampled before the pop so this element's own marker is included.
    const int textCountBefore = text.NumPositive();
    text.Pop();

    if ( elementJustOpened ) {
        fprintf( fp, "/>" );
    }
    else {
        if ( textCountBefore == 0 ) {
            PrintSpace( depth );
        }
        fprintf( fp, "</%s>", name );
    }

    if ( text.NumPositive() == 0 ) {
        fprintf( fp, "\n" );
    }
    elementJustOpened = false;
}
// Finishes the open tag with '>', followed by a newline unless a non-empty
// entry is on the 'text' stack.
void XMLStreamer::SealElement()
{
    elementJustOpened = false;
    fprintf( fp, ">" );

    const bool insideText = text.NumPositive() != 0;
    if ( !insideText ) {
        fprintf( fp, "\n" );
    }
}
// Writes 'text' as-is, sealing a still-open tag first.
void XMLStreamer::PushText( const char* text )
{
    if ( elementJustOpened ) {
        SealElement();
    }
    const char* const content = text;
    fprintf( fp, "%s", content );
}
// Writes an indented comment on its own line, sealing a still-open tag
// first.
void XMLStreamer::PushComment( const char* comment )
{
    const bool tagStillOpen = elementJustOpened;
    if ( tagStillOpen ) {
        SealElement();
    }
    PrintSpace( depth );
    fprintf( fp, "<!--%s-->\n", comment );
}