tinyxml2/tinyxml2.cpp

518 lines
10 KiB
C++
Raw Normal View History

2011-12-29 03:42:49 +00:00
#include "tinyxml2.h"
#include <string.h>
#include <stdlib.h>
#include <stdio.h>
2011-12-31 22:58:18 +00:00
#include <ctype.h>
2011-12-29 03:42:49 +00:00
using namespace tinyxml2;
// Every line ending is normalized to a single LF (0x0a).
static const char LINE_FEED = static_cast<char>( 0x0a );
2012-01-15 02:08:12 +00:00
// Short alias for LINE_FEED.
static const char LF = LINE_FEED;

// CR (0x0d) is filtered out when line endings are normalized.
static const char CARRIAGE_RETURN = static_cast<char>( 0x0d );
// Short alias for CARRIAGE_RETURN.
static const char CR = CARRIAGE_RETURN;

// The two quote characters.
static const char SINGLE_QUOTE = '\'';
static const char DOUBLE_QUOTE = '"';
2012-01-15 02:08:12 +00:00
// --------- CharBuffer ----------- //
2011-12-29 03:42:49 +00:00
// Allocates a CharBuffer with malloc() and copies the NUL-terminated string
// `in` into its `mem` storage. The allocation is strlen(in) + sizeof(CharBuffer)
// bytes and `length` records strlen(in). Release the result with
// CharBuffer::Free().
// NOTE(review): presumably `mem` is a trailing array of at least one char so the
// terminator fits inside the allocation -- confirm against tinyxml2.h.
/*static*/ CharBuffer* CharBuffer::Construct( const char* in )
{
    const size_t textLength = strlen( in );
    CharBuffer* buffer = (CharBuffer*) malloc( textLength + sizeof( CharBuffer ) );
    buffer->length = textLength;
    // +1 so the terminating NUL is copied too, exactly as strcpy would.
    memcpy( buffer->mem, in, textLength + 1 );
    return buffer;
}
// Releases a buffer by handing `cb` to free(); the counterpart of the malloc()
// performed in CharBuffer::Construct().
/*static*/ void CharBuffer::Free( CharBuffer* cb )
{
    ::free( cb );
}
// Returns the NUL-terminated string for this pair, flushing it first if needed.
//
// When NEEDS_FLUSH is set, the range [start, end) is terminated in place by
// writing 0 at *end. If entity processing or newline normalization was
// requested, the text is also compacted in place so that CR, CR-LF, LF and
// LF-CR each collapse to a single LF. (No entity decoding is performed here.)
// All flags are cleared afterwards, so the work happens only once.
const char* StrPair::GetStr()
{
    if ( flags & NEEDS_FLUSH ) {
        *end = 0;

        if ( flags & ( NEEDS_ENTITY_PROCESSING | NEEDS_NEWLINE_NORMALIZATION ) ) {
            char* p = start;    // read cursor
            char* q = start;    // write cursor; never gets ahead of p

            while ( p < end ) {
                if ( *p == CR ) {
                    // CR-LF pair becomes LF; CR alone becomes LF.
                    // Reading p+1 is safe: at worst it is `end`, which holds
                    // the terminator written above.
                    p += ( *(p+1) == LF ) ? 2 : 1;
                    *q++ = LF;
                }
                else if ( *p == LF ) {
                    // LF-CR becomes LF; LF alone stays LF.
                    p += ( *(p+1) == CR ) ? 2 : 1;
                    *q++ = LF;
                }
                else {
                    *q++ = *p++;
                }
            }
            // The text may have shrunk; terminate at the new end so no stale
            // characters trail the normalized string.
            *q = 0;
        }
        flags = 0;
    }
    return start;
}
2012-01-19 01:43:40 +00:00
// --------- XMLBase ----------- //
char* XMLBase::ParseText( char* p, StrPair* pair, const char* endTag )
2012-01-19 01:43:40 +00:00
{
TIXMLASSERT( endTag && *endTag );
char* start = p;
char endChar = *endTag;
int length = strlen( endTag );
// Inner loop of text parsing.
while ( *p ) {
if ( *p == endChar && strncmp( p, endTag, length ) == 0 ) {
pair->Set( start, p, StrPair::NEEDS_ENTITY_PROCESSING | StrPair::NEEDS_NEWLINE_NORMALIZATION );
2012-01-23 19:42:06 +00:00
return p + length;
2012-01-19 01:43:40 +00:00
}
2012-01-23 19:42:06 +00:00
++p;
2012-01-19 01:43:40 +00:00
}
return p;
2012-01-19 01:43:40 +00:00
}
2012-01-20 20:55:24 +00:00
char* XMLBase::ParseName( char* p, StrPair* pair )
2012-01-19 01:43:40 +00:00
{
char* start = p;
start = p;
if ( !start || !(*start) ) {
return 0;
}
if ( !IsAlpha( *p ) ) {
return 0;
}
while( *p && (
IsAlphaNum( (unsigned char) *p )
|| *p == '_'
|| *p == '-'
|| *p == '.'
|| *p == ':' ))
{
++p;
}
if ( p > start ) {
pair->Set( start, p, 0 );
return p;
2012-01-19 01:43:40 +00:00
}
2012-01-20 19:27:56 +00:00
return 0;
2012-01-19 01:43:40 +00:00
}
// Looks at the input at `p` (after skipping whitespace), decides what kind of
// node starts there, and allocates it with `new`.
//
// On success *node receives the new node and the return value is where that
// node's ParseDeep() should start:
//   - comment ("<!--"): just past the header
//   - element ("<"):    just past the '<'
//   - text:             the original `p`, so leading whitespace stays in the text
// Returns 0 with *node set to 0 at end of input or when the content is not
// recognized. Returning 0 in the unrecognized case matters: callers loop while
// the returned pointer is non-null, so handing back an unadvanced pointer with
// no node would make them spin forever.
//
// Declarations ("<?xml"), DTDs ("<!") and CDATA ("<![CDATA[") are not yet
// distinguished; because they start with '<' they take the element path.
char* XMLBase::Identify( XMLDocument* document, char* p, XMLNode** node )
{
    *node = 0;

    char* const start = p;
    p = XMLNode::SkipWhiteSpace( p );
    if ( !p || !*p ) {
        return 0;
    }

    static const char* commentHeader = "<!--";
    static const char* elementHeader = "<";     // header for everything else; check last.
    static const int commentHeaderLen = 4;
    static const int elementHeaderLen = 1;

    if ( StringEqual( p, commentHeader, commentHeaderLen ) ) {
        *node = new XMLComment( document );
        return p + commentHeaderLen;
    }
    if ( StringEqual( p, elementHeader, elementHeaderLen ) ) {
        *node = new XMLElement( document );
        return p + elementHeaderLen;
    }
    // fixme: better text detection
    if ( IsAlphaNum( *p ) ) {
        // fixme: this is filtering out empty text...should it?
        *node = new XMLText( document );
        return start;   // Back it up, all the text counts.
    }

    // Unrecognized content: flag it in debug builds and stop the caller.
    TIXMLASSERT( 0 );
    return 0;
}
// --------- XMLNode ----------- //
// Creates a node associated with `doc` that has no parent, no children and no
// siblings.
XMLNode::XMLNode( XMLDocument* doc )
    : document( doc ),
      parent( 0 ),
      firstChild( 0 ),
      lastChild( 0 ),
      prev( 0 ),
      next( 0 )
{
}
// Destroys the node together with all of its children.
XMLNode::~XMLNode()
{
    // Detach and delete from the front; Unlink() moves firstChild forward, so
    // the loop ends once the list is empty.
    while ( XMLNode* child = firstChild ) {
        Unlink( child );
        delete child;
    }
}
// Removes `child` from this node's child list without deleting it.
// `child` must currently be a child of this node. After the call the child is
// fully detached: its parent, prev and next pointers are all null, so it no
// longer refers to its former siblings.
void XMLNode::Unlink( XMLNode* child )
{
    TIXMLASSERT( child->parent == this );

    // Fix the list ends first, while child's own links are still intact.
    if ( child == firstChild ) {
        firstChild = firstChild->next;
    }
    if ( child == lastChild ) {
        lastChild = lastChild->prev;
    }

    // Splice the neighbours together.
    if ( child->prev ) {
        child->prev->next = child->next;
    }
    if ( child->next ) {
        child->next->prev = child->prev;
    }

    // Clear every link so the detached node holds no stale pointers.
    child->prev = 0;
    child->next = 0;
    child->parent = 0;
}
// Appends `addThis` as the last child of this node and returns it.
// The node's parent/prev/next links are overwritten; it is not removed from any
// list it may already belong to.
XMLNode* XMLNode::InsertEndChild( XMLNode* addThis )
{
    XMLNode* const previousLast = lastChild;

    if ( previousLast ) {
        // Non-empty list: hook the new node behind the current tail.
        TIXMLASSERT( firstChild );
        TIXMLASSERT( previousLast->next == 0 );
        previousLast->next = addThis;
    }
    else {
        // Empty list: the new node is also the head.
        TIXMLASSERT( firstChild == 0 );
        firstChild = addThis;
    }

    addThis->prev = previousLast;   // null when the list was empty
    addThis->parent = this;
    addThis->next = 0;
    lastChild = addThis;
    return addThis;
}
void XMLNode::Print( FILE* fp, int depth )
{
for( XMLNode* node = firstChild; node; node=node->next ) {
node->Print( fp, depth );
}
}
2012-01-19 01:55:48 +00:00
// Writes one indentation unit to `fp` for each level of `depth`; writes nothing
// when `depth` is zero or negative.
void XMLNode::PrintSpace( FILE* fp, int depth )
{
    int remaining = depth;
    while ( remaining > 0 ) {
        fputs( " ", fp );
        --remaining;
    }
}
2012-01-23 23:32:10 +00:00
// --------- XMLText ---------- //
// Reads text up to the next '<' into `value`.
// ParseText() consumes the '<', so on success the result is backed up by one
// character to leave the '<' for whatever parses next. Returns 0 if ParseText()
// returns null or a pointer to the end of the input.
char* XMLText::ParseDeep( char* p )
{
    char* afterTag = ParseText( p, &value, "<" );
    if ( !afterTag || !*afterTag ) {
        return 0;
    }
    return afterTag - 1;
}
// Writes the text verbatim to `cfile`. `depth` is not used: text is emitted
// without indentation.
void XMLText::Print( FILE* cfile, int depth )
{
    (void) depth;
    // The text comes from the parsed document, so it must never be used as a
    // printf format string: a '%' in it would be interpreted as a conversion.
    fputs( value.GetStr(), cfile );
}
// --------- XMLComment ---------- //
// Creates an empty comment node associated with `doc`.
XMLComment::XMLComment( XMLDocument* doc )
    : XMLNode( doc )
{
}
2012-01-11 23:43:54 +00:00
// Nothing comment-specific to release; the XMLNode destructor handles children.
XMLComment::~XMLComment()
{
}
2012-01-11 23:43:54 +00:00
void XMLComment::Print( FILE* fp, int depth )
{
XMLNode::Print( fp, depth );
2012-01-23 19:42:06 +00:00
fprintf( fp, "<!--%s-->\n", value.GetStr() );
2012-01-11 23:43:54 +00:00
}
// Reads the comment body into `value`; `p` is expected to point just past the
// "<!--" header. Returns whatever ParseText() returns for the "-->" terminator.
char* XMLComment::ParseDeep( char* p )
{
    // A comment is parsed like plain text that ends at "-->".
    char* afterComment = ParseText( p, &value, "-->" );
    return afterComment;
}
2012-01-19 01:43:40 +00:00
// --------- XMLAttribute ---------- //
char* XMLAttribute::ParseDeep( char* p )
{
2012-01-23 21:29:35 +00:00
p = ParseText( p, &name, "=" );
if ( !p || !*p ) return 0;
2012-01-19 01:43:40 +00:00
char endTag[2] = { *p, 0 };
++p;
p = ParseText( p, &value, endTag );
if ( value.Empty() ) return 0;
2012-01-19 01:43:40 +00:00
return p;
}
2012-01-19 01:55:48 +00:00
void XMLAttribute::Print( FILE* cfile )
{
2012-01-23 21:29:35 +00:00
// fixme: sort out single vs. double quote
fprintf( cfile, "%s=\"%s\"", name.GetStr(), value.GetStr() );
2012-01-19 01:55:48 +00:00
}
2012-01-19 01:43:40 +00:00
// --------- XMLElement ---------- //
// Creates an element associated with `doc`: not a closing tag, no attributes.
XMLElement::XMLElement( XMLDocument* doc )
    : XMLNode( doc ),
      closing( false ),
      rootAttribute( 0 ),
      lastAttribute( 0 )
{
}
// Deletes every attribute in the element's attribute list.
XMLElement::~XMLElement()
{
    for ( XMLAttribute* current = rootAttribute; current; ) {
        // Fetch the successor before the node holding it is destroyed.
        XMLAttribute* following = current->next;
        delete current;
        current = following;
    }
}
char* XMLElement::ParseDeep( char* p )
{
// Read the element name.
p = SkipWhiteSpace( p );
if ( !p ) return 0;
const char* start = p;
// The closing element is the </element> form. It is
// parsed just like a regular element then deleted from
// the DOM.
if ( *p == '/' ) {
closing = true;
++p;
}
p = ParseName( p, &name );
if ( name.Empty() ) return 0;
2012-01-19 01:43:40 +00:00
// Read the attributes.
while( p ) {
p = SkipWhiteSpace( p );
if ( !p || !(*p) ) {
document->SetError( XMLDocument::ERROR_PARSING_ELEMENT, start, name.GetStr() );
2012-01-19 01:43:40 +00:00
return 0;
}
// attribute.
2012-01-23 21:29:35 +00:00
if ( IsAlpha( *p ) ) {
2012-01-19 01:43:40 +00:00
XMLAttribute* attrib = new XMLAttribute( this );
p = attrib->ParseDeep( p );
if ( !p ) {
delete attrib;
document->SetError( XMLDocument::ERROR_PARSING_ATTRIBUTE, start, p );
2012-01-19 01:43:40 +00:00
return 0;
}
if ( rootAttribute ) {
TIXMLASSERT( lastAttribute );
lastAttribute->next = attrib;
lastAttribute = attrib;
}
else {
rootAttribute = lastAttribute = attrib;
}
}
// end of the tag
2012-01-19 01:43:40 +00:00
else if ( *p == '/' && *(p+1) == '>' ) {
if ( closing ) {
document->SetError( XMLDocument::ERROR_PARSING_ELEMENT, start, p );
return 0;
}
return p+2; // done; sealed element.
}
// end of the tag
2012-01-19 01:43:40 +00:00
else if ( *p == '>' ) {
++p;
break;
}
else {
document->SetError( XMLDocument::ERROR_PARSING_ELEMENT, start, p );
return 0;
}
2012-01-19 01:43:40 +00:00
}
while( p && *p ) {
XMLNode* node = 0;
p = Identify( document, p, &node );
if ( p && node ) {
p = node->ParseDeep( p );
2012-01-19 01:43:40 +00:00
XMLElement* element = node->ToElement();
if ( element && element->Closing() ) {
if ( StringEqual( element->Name(), this->Name() ) ) {
// All good, this is closing tag.
delete node;
}
else {
document->SetError( XMLDocument::ERROR_PARSING_ELEMENT, start, p );
delete node;
p = 0;
2012-01-19 01:43:40 +00:00
}
return p;
}
else {
this->InsertEndChild( node );
}
}
}
return 0;
}
2012-01-19 01:55:48 +00:00
void XMLElement::Print( FILE* cfile, int depth )
{
PrintSpace( cfile, depth );
fprintf( cfile, "<%s", Name() );
for( XMLAttribute* attrib=rootAttribute; attrib; attrib=attrib->next ) {
fprintf( cfile, " " );
attrib->Print( cfile );
}
if ( firstChild ) {
2012-01-23 23:32:10 +00:00
// fixme: once text is on, it should stay on, and not use newlines.
bool useNewline = firstChild->ToText() == 0;
fprintf( cfile, ">", Name() );
if ( useNewline ) fprintf( cfile, "\n" );
2012-01-19 01:55:48 +00:00
for( XMLNode* node=firstChild; node; node=node->next ) {
node->Print( cfile, depth+1 );
}
2012-01-23 23:32:10 +00:00
2012-01-23 19:42:06 +00:00
fprintf( cfile, "</%s>\n", Name() );
2012-01-23 23:32:10 +00:00
// fixme: see note above
//if ( useNewline ) fprintf( cfile, "\n" );
2012-01-19 01:55:48 +00:00
}
else {
fprintf( cfile, "/>\n" );
}
}
// --------- XMLDocument ----------- //
2011-12-29 03:42:49 +00:00
// Creates an empty document: no text buffer yet, and a fresh root node that
// will hold the parsed top-level nodes.
XMLDocument::XMLDocument()
    : charBuffer( 0 )
{
    root = new XMLNode( this );
}
2011-12-28 22:36:55 +00:00
// Destroys the node tree and then the text buffer.
XMLDocument::~XMLDocument()
{
    // The tree goes first, while the buffer it was parsed from is still valid.
    delete root;
    // The buffer comes from malloc() in CharBuffer::Construct(), so it must be
    // released through CharBuffer::Free() (free), never with delete.
    // Freeing a null pointer is a no-op, so a never-parsed document is fine.
    CharBuffer::Free( charBuffer );
}
bool XMLDocument::Parse( const char* p )
{
2012-01-11 23:43:54 +00:00
charBuffer = CharBuffer::Construct( p );
XMLNode* node = 0;
2012-01-23 21:29:35 +00:00
// fixme: clean up
2012-01-19 01:43:40 +00:00
char* q = Identify( this, charBuffer->mem, &node );
2012-01-23 19:42:06 +00:00
while ( node ) {
2012-01-19 01:55:48 +00:00
root->InsertEndChild( node );
2012-01-23 19:42:06 +00:00
q = node->ParseDeep( q );
node = 0;
if ( q && *q ) {
q = Identify( this, q, &node );
}
2012-01-19 01:55:48 +00:00
}
return false;
}
2012-01-11 23:43:54 +00:00
void XMLDocument::Print( FILE* fp, int depth )
{
2012-01-11 23:43:54 +00:00
for( XMLNode* node = root->firstChild; node; node=node->next ) {
node->Print( fp, depth );
}
}