1 | /* |
---|
2 | www.sourceforge.net/projects/tinyxml |
---|
3 | Original code (2.0 and earlier )copyright (c) 2000-2002 Lee Thomason (www.grinninglizard.com) |
---|
4 | |
---|
5 | This software is provided 'as-is', without any express or implied |
---|
6 | warranty. In no event will the authors be held liable for any |
---|
7 | damages arising from the use of this software. |
---|
8 | |
---|
9 | Permission is granted to anyone to use this software for any |
---|
10 | purpose, including commercial applications, and to alter it and |
---|
11 | redistribute it freely, subject to the following restrictions: |
---|
12 | |
---|
13 | 1. The origin of this software must not be misrepresented; you must |
---|
14 | not claim that you wrote the original software. If you use this |
---|
15 | software in a product, an acknowledgment in the product documentation |
---|
16 | would be appreciated but is not required. |
---|
17 | |
---|
18 | 2. Altered source versions must be plainly marked as such, and |
---|
19 | must not be misrepresented as being the original software. |
---|
20 | |
---|
21 | 3. This notice may not be removed or altered from any source |
---|
22 | distribution. |
---|
23 | */ |
---|
24 | |
---|
25 | #include "tinyxml.h" |
---|
26 | #include <ctype.h> |
---|
27 | |
---|
28 | //#define DEBUG_PARSER |
---|
29 | |
---|
30 | // Note tha "PutString" hardcodes the same list. This |
---|
31 | // is less flexible than it appears. Changing the entries |
---|
32 | // or order will break putstring. |
---|
33 | TiXmlBase::Entity TiXmlBase::entity[ NUM_ENTITY ] = |
---|
34 | { |
---|
35 | { "&", 5, '&' }, |
---|
36 | { "<", 4, '<' }, |
---|
37 | { ">", 4, '>' }, |
---|
38 | { """, 6, '\"' }, |
---|
39 | { "'", 6, '\'' } |
---|
40 | }; |
---|
41 | |
---|
42 | |
---|
43 | const char* TiXmlBase::SkipWhiteSpace( const char* p ) |
---|
44 | { |
---|
45 | if ( !p || !*p ) |
---|
46 | { |
---|
47 | return 0; |
---|
48 | } |
---|
49 | while ( p && *p ) |
---|
50 | { |
---|
51 | if ( isspace( *p ) || *p == '\n' || *p =='\r' ) // Still using old rules for white space. |
---|
52 | ++p; |
---|
53 | else |
---|
54 | break; |
---|
55 | } |
---|
56 | |
---|
57 | return p; |
---|
58 | } |
---|
59 | |
---|
60 | #ifdef TIXML_USE_STL |
---|
61 | /*static*/ bool TiXmlBase::StreamWhiteSpace( TIXML_ISTREAM * in, TIXML_STRING * tag ) |
---|
62 | { |
---|
63 | for( ;; ) |
---|
64 | { |
---|
65 | if ( !in->good() ) return false; |
---|
66 | |
---|
67 | int c = in->peek(); |
---|
68 | if ( !IsWhiteSpace( c ) ) |
---|
69 | return true; |
---|
70 | *tag += in->get(); |
---|
71 | } |
---|
72 | } |
---|
73 | |
---|
74 | /*static*/ bool TiXmlBase::StreamTo( TIXML_ISTREAM * in, int character, TIXML_STRING * tag ) |
---|
75 | { |
---|
76 | while ( in->good() ) |
---|
77 | { |
---|
78 | int c = in->peek(); |
---|
79 | if ( c == character ) |
---|
80 | return true; |
---|
81 | |
---|
82 | in->get(); |
---|
83 | *tag += c; |
---|
84 | } |
---|
85 | return false; |
---|
86 | } |
---|
87 | #endif |
---|
88 | |
---|
89 | const char* TiXmlBase::ReadName( const char* p, TIXML_STRING * name ) |
---|
90 | { |
---|
91 | *name = ""; |
---|
92 | assert( p ); |
---|
93 | |
---|
94 | // Names start with letters or underscores. |
---|
95 | // After that, they can be letters, underscores, numbers, |
---|
96 | // hyphens, or colons. (Colons are valid ony for namespaces, |
---|
97 | // but tinyxml can't tell namespaces from names.) |
---|
98 | if ( p && *p |
---|
99 | && ( isalpha( (unsigned char) *p ) || *p == '_' ) ) |
---|
100 | { |
---|
101 | while( p && *p |
---|
102 | && ( isalnum( (unsigned char ) *p ) |
---|
103 | || *p == '_' |
---|
104 | || *p == '-' |
---|
105 | || *p == ':' ) ) |
---|
106 | { |
---|
107 | (*name) += *p; |
---|
108 | ++p; |
---|
109 | } |
---|
110 | return p; |
---|
111 | } |
---|
112 | return 0; |
---|
113 | } |
---|
114 | |
---|
115 | const char* TiXmlBase::GetEntity( const char* p, char* value ) |
---|
116 | { |
---|
117 | // Presume an entity, and pull it out. |
---|
118 | TIXML_STRING ent; |
---|
119 | int i; |
---|
120 | |
---|
121 | // Ignore the &#x entities. |
---|
122 | if ( strncmp( "&#x", p, 3 ) == 0 |
---|
123 | && *(p+3) |
---|
124 | && *(p+4) ) |
---|
125 | { |
---|
126 | *value = 0; |
---|
127 | |
---|
128 | if ( isalpha( *(p+3) ) ) *value += ( tolower( *(p+3) ) - 'a' + 10 ) * 16; |
---|
129 | else *value += ( *(p+3) - '0' ) * 16; |
---|
130 | |
---|
131 | if ( isalpha( *(p+4) ) ) *value += ( tolower( *(p+4) ) - 'a' + 10 ); |
---|
132 | else *value += ( *(p+4) - '0' ); |
---|
133 | |
---|
134 | return p+6; |
---|
135 | } |
---|
136 | |
---|
137 | // Now try to match it. |
---|
138 | for( i=0; i<NUM_ENTITY; ++i ) |
---|
139 | { |
---|
140 | if ( strncmp( entity[i].str, p, entity[i].strLength ) == 0 ) |
---|
141 | { |
---|
142 | assert( strlen( entity[i].str ) == entity[i].strLength ); |
---|
143 | *value = entity[i].chr; |
---|
144 | return ( p + entity[i].strLength ); |
---|
145 | } |
---|
146 | } |
---|
147 | |
---|
148 | // So it wasn't an entity, its unrecognized, or something like that. |
---|
149 | *value = *p; // Don't put back the last one, since we return it! |
---|
150 | return p+1; |
---|
151 | } |
---|
152 | |
---|
153 | |
---|
154 | bool TiXmlBase::StringEqual( const char* p, |
---|
155 | const char* tag, |
---|
156 | bool ignoreCase ) |
---|
157 | { |
---|
158 | assert( p ); |
---|
159 | if ( !p || !*p ) |
---|
160 | { |
---|
161 | assert( 0 ); |
---|
162 | return false; |
---|
163 | } |
---|
164 | |
---|
165 | if ( tolower( *p ) == tolower( *tag ) ) |
---|
166 | { |
---|
167 | const char* q = p; |
---|
168 | |
---|
169 | if (ignoreCase) |
---|
170 | { |
---|
171 | while ( *q && *tag && *q == *tag ) |
---|
172 | { |
---|
173 | ++q; |
---|
174 | ++tag; |
---|
175 | } |
---|
176 | |
---|
177 | if ( *tag == 0 ) // Have we found the end of the tag, and everything equal? |
---|
178 | { |
---|
179 | return true; |
---|
180 | } |
---|
181 | } |
---|
182 | else |
---|
183 | { |
---|
184 | while ( *q && *tag && tolower( *q ) == tolower( *tag ) ) |
---|
185 | { |
---|
186 | ++q; |
---|
187 | ++tag; |
---|
188 | } |
---|
189 | |
---|
190 | if ( *tag == 0 ) |
---|
191 | { |
---|
192 | return true; |
---|
193 | } |
---|
194 | } |
---|
195 | } |
---|
196 | return false; |
---|
197 | } |
---|
198 | |
---|
199 | const char* TiXmlBase::ReadText( const char* p, |
---|
200 | TIXML_STRING * text, |
---|
201 | bool trimWhiteSpace, |
---|
202 | const char* endTag, |
---|
203 | bool caseInsensitive ) |
---|
204 | { |
---|
205 | *text = ""; |
---|
206 | if ( !trimWhiteSpace // certain tags always keep whitespace |
---|
207 | || !condenseWhiteSpace ) // if true, whitespace is always kept |
---|
208 | { |
---|
209 | // Keep all the white space. |
---|
210 | while ( p && *p |
---|
211 | && !StringEqual( p, endTag, caseInsensitive ) |
---|
212 | ) |
---|
213 | { |
---|
214 | char c; |
---|
215 | p = GetChar( p, &c ); |
---|
216 | (* text) += c; |
---|
217 | } |
---|
218 | } |
---|
219 | else |
---|
220 | { |
---|
221 | bool whitespace = false; |
---|
222 | |
---|
223 | // Remove leading white space: |
---|
224 | p = SkipWhiteSpace( p ); |
---|
225 | while ( p && *p |
---|
226 | && !StringEqual( p, endTag, caseInsensitive ) ) |
---|
227 | { |
---|
228 | if ( *p == '\r' || *p == '\n' ) |
---|
229 | { |
---|
230 | whitespace = true; |
---|
231 | ++p; |
---|
232 | } |
---|
233 | else if ( isspace( *p ) ) |
---|
234 | { |
---|
235 | whitespace = true; |
---|
236 | ++p; |
---|
237 | } |
---|
238 | else |
---|
239 | { |
---|
240 | // If we've found whitespace, add it before the |
---|
241 | // new character. Any whitespace just becomes a space. |
---|
242 | if ( whitespace ) |
---|
243 | { |
---|
244 | (* text) += ' '; |
---|
245 | whitespace = false; |
---|
246 | } |
---|
247 | char c; |
---|
248 | p = GetChar( p, &c ); |
---|
249 | (* text) += c; |
---|
250 | } |
---|
251 | } |
---|
252 | } |
---|
253 | return p + strlen( endTag ); |
---|
254 | } |
---|
255 | |
---|
256 | #ifdef TIXML_USE_STL |
---|
257 | |
---|
258 | void TiXmlDocument::StreamIn( TIXML_ISTREAM * in, TIXML_STRING * tag ) |
---|
259 | { |
---|
260 | // The basic issue with a document is that we don't know what we're |
---|
261 | // streaming. Read something presumed to be a tag (and hope), then |
---|
262 | // identify it, and call the appropriate stream method on the tag. |
---|
263 | // |
---|
264 | // This "pre-streaming" will never read the closing ">" so the |
---|
265 | // sub-tag can orient itself. |
---|
266 | |
---|
267 | if ( !StreamTo( in, '<', tag ) ) |
---|
268 | { |
---|
269 | SetError( TIXML_ERROR_PARSING_EMPTY ); |
---|
270 | return; |
---|
271 | } |
---|
272 | |
---|
273 | while ( in->good() ) |
---|
274 | { |
---|
275 | size_t tagIndex = tag->length(); |
---|
276 | while ( in->good() && in->peek() != '>' ) |
---|
277 | { |
---|
278 | int c = in->get(); |
---|
279 | (*tag) += (char) c; |
---|
280 | } |
---|
281 | |
---|
282 | if ( in->good() ) |
---|
283 | { |
---|
284 | // We now have something we presume to be a node of |
---|
285 | // some sort. Identify it, and call the node to |
---|
286 | // continue streaming. |
---|
287 | TiXmlNode* node = Identify( tag->c_str() + tagIndex ); |
---|
288 | |
---|
289 | if ( node ) |
---|
290 | { |
---|
291 | node->StreamIn( in, tag ); |
---|
292 | bool isElement = node->ToElement() != 0; |
---|
293 | delete node; |
---|
294 | node = 0; |
---|
295 | |
---|
296 | // If this is the root element, we're done. Parsing will be |
---|
297 | // done by the >> operator. |
---|
298 | if ( isElement ) |
---|
299 | { |
---|
300 | return; |
---|
301 | } |
---|
302 | } |
---|
303 | else |
---|
304 | { |
---|
305 | SetError( TIXML_ERROR ); |
---|
306 | return; |
---|
307 | } |
---|
308 | } |
---|
309 | } |
---|
310 | // We should have returned sooner. |
---|
311 | SetError( TIXML_ERROR ); |
---|
312 | } |
---|
313 | |
---|
314 | #endif |
---|
315 | |
---|
316 | const char* TiXmlDocument::Parse( const char* p ) |
---|
317 | { |
---|
318 | // Parse away, at the document level. Since a document |
---|
319 | // contains nothing but other tags, most of what happens |
---|
320 | // here is skipping white space. |
---|
321 | // |
---|
322 | // In this variant (as opposed to stream and Parse) we |
---|
323 | // read everything we can. |
---|
324 | |
---|
325 | |
---|
326 | if ( !p || !*p ) |
---|
327 | { |
---|
328 | SetError( TIXML_ERROR_DOCUMENT_EMPTY ); |
---|
329 | return false; |
---|
330 | } |
---|
331 | |
---|
332 | p = SkipWhiteSpace( p ); |
---|
333 | if ( !p ) |
---|
334 | { |
---|
335 | SetError( TIXML_ERROR_DOCUMENT_EMPTY ); |
---|
336 | return false; |
---|
337 | } |
---|
338 | |
---|
339 | while ( p && *p ) |
---|
340 | { |
---|
341 | TiXmlNode* node = Identify( p ); |
---|
342 | if ( node ) |
---|
343 | { |
---|
344 | p = node->Parse( p ); |
---|
345 | LinkEndChild( node ); |
---|
346 | } |
---|
347 | else |
---|
348 | { |
---|
349 | break; |
---|
350 | } |
---|
351 | p = SkipWhiteSpace( p ); |
---|
352 | } |
---|
353 | // All is well. |
---|
354 | return p; |
---|
355 | } |
---|
356 | |
---|
357 | |
---|
358 | TiXmlNode* TiXmlNode::Identify( const char* p ) |
---|
359 | { |
---|
360 | TiXmlNode* returnNode = 0; |
---|
361 | |
---|
362 | p = SkipWhiteSpace( p ); |
---|
363 | if( !p || !*p || *p != '<' ) |
---|
364 | { |
---|
365 | return 0; |
---|
366 | } |
---|
367 | |
---|
368 | TiXmlDocument* doc = GetDocument(); |
---|
369 | p = SkipWhiteSpace( p ); |
---|
370 | |
---|
371 | if ( !p || !*p ) |
---|
372 | { |
---|
373 | return 0; |
---|
374 | } |
---|
375 | |
---|
376 | // What is this thing? |
---|
377 | // - Elements start with a letter or underscore, but xml is reserved. |
---|
378 | // - Comments: <!-- |
---|
379 | // - Decleration: <?xml |
---|
380 | // - Everthing else is unknown to tinyxml. |
---|
381 | // |
---|
382 | |
---|
383 | const char* xmlHeader = { "<?xml" }; |
---|
384 | const char* commentHeader = { "<!--" }; |
---|
385 | |
---|
386 | if ( StringEqual( p, xmlHeader, true ) ) |
---|
387 | { |
---|
388 | #ifdef DEBUG_PARSER |
---|
389 | TIXML_LOG( "XML parsing Declaration\n" ); |
---|
390 | #endif |
---|
391 | returnNode = new TiXmlDeclaration(); |
---|
392 | } |
---|
393 | else if ( isalpha( *(p+1) ) |
---|
394 | || *(p+1) == '_' ) |
---|
395 | { |
---|
396 | #ifdef DEBUG_PARSER |
---|
397 | TIXML_LOG( "XML parsing Element\n" ); |
---|
398 | #endif |
---|
399 | returnNode = new TiXmlElement( "" ); |
---|
400 | } |
---|
401 | else if ( StringEqual( p, commentHeader, false ) ) |
---|
402 | { |
---|
403 | #ifdef DEBUG_PARSER |
---|
404 | TIXML_LOG( "XML parsing Comment\n" ); |
---|
405 | #endif |
---|
406 | returnNode = new TiXmlComment(); |
---|
407 | } |
---|
408 | else |
---|
409 | { |
---|
410 | #ifdef DEBUG_PARSER |
---|
411 | TIXML_LOG( "XML parsing Unknown\n" ); |
---|
412 | #endif |
---|
413 | returnNode = new TiXmlUnknown(); |
---|
414 | } |
---|
415 | |
---|
416 | if ( returnNode ) |
---|
417 | { |
---|
418 | // Set the parent, so it can report errors |
---|
419 | returnNode->parent = this; |
---|
420 | //p = returnNode->Parse( p ); |
---|
421 | } |
---|
422 | else |
---|
423 | { |
---|
424 | if ( doc ) |
---|
425 | doc->SetError( TIXML_ERROR_OUT_OF_MEMORY ); |
---|
426 | } |
---|
427 | return returnNode; |
---|
428 | } |
---|
429 | |
---|
430 | #ifdef TIXML_USE_STL |
---|
431 | |
---|
432 | void TiXmlElement::StreamIn (TIXML_ISTREAM * in, TIXML_STRING * tag) |
---|
433 | { |
---|
434 | // We're called with some amount of pre-parsing. That is, some of "this" |
---|
435 | // element is in "tag". Go ahead and stream to the closing ">" |
---|
436 | while( in->good() ) |
---|
437 | { |
---|
438 | int c = in->get(); |
---|
439 | (*tag) += (char) c ; |
---|
440 | |
---|
441 | if ( c == '>' ) |
---|
442 | break; |
---|
443 | } |
---|
444 | |
---|
445 | if ( tag->length() < 3 ) return; |
---|
446 | |
---|
447 | // Okay...if we are a "/>" tag, then we're done. We've read a complete tag. |
---|
448 | // If not, identify and stream. |
---|
449 | |
---|
450 | if ( tag->at( tag->length() - 1 ) == '>' |
---|
451 | && tag->at( tag->length() - 2 ) == '/' ) |
---|
452 | { |
---|
453 | // All good! |
---|
454 | return; |
---|
455 | } |
---|
456 | else if ( tag->at( tag->length() - 1 ) == '>' ) |
---|
457 | { |
---|
458 | // There is more. Could be: |
---|
459 | // text |
---|
460 | // closing tag |
---|
461 | // another node. |
---|
462 | for ( ;; ) |
---|
463 | { |
---|
464 | StreamWhiteSpace( in, tag ); |
---|
465 | |
---|
466 | // Do we have text? |
---|
467 | if ( in->peek() != '<' ) |
---|
468 | { |
---|
469 | // Yep, text. |
---|
470 | TiXmlText text( "" ); |
---|
471 | text.StreamIn( in, tag ); |
---|
472 | |
---|
473 | // What follows text is a closing tag or another node. |
---|
474 | // Go around again and figure it out. |
---|
475 | continue; |
---|
476 | } |
---|
477 | |
---|
478 | // We now have either a closing tag...or another node. |
---|
479 | // We should be at a "<", regardless. |
---|
480 | if ( !in->good() ) return; |
---|
481 | assert( in->peek() == '<' ); |
---|
482 | size_t tagIndex = tag->length(); |
---|
483 | |
---|
484 | bool closingTag = false; |
---|
485 | bool firstCharFound = false; |
---|
486 | |
---|
487 | for( ;; ) |
---|
488 | { |
---|
489 | if ( !in->good() ) |
---|
490 | return; |
---|
491 | |
---|
492 | int c = in->peek(); |
---|
493 | |
---|
494 | if ( c == '>' ) |
---|
495 | break; |
---|
496 | |
---|
497 | *tag += c; |
---|
498 | in->get(); |
---|
499 | |
---|
500 | if ( !firstCharFound && c != '<' && !IsWhiteSpace( c ) ) |
---|
501 | { |
---|
502 | firstCharFound = true; |
---|
503 | if ( c == '/' ) |
---|
504 | closingTag = true; |
---|
505 | } |
---|
506 | } |
---|
507 | // If it was a closing tag, then read in the closing '>' to clean up the input stream. |
---|
508 | // If it was not, the streaming will be done by the tag. |
---|
509 | if ( closingTag ) |
---|
510 | { |
---|
511 | int c = in->get(); |
---|
512 | assert( c == '>' ); |
---|
513 | *tag += c; |
---|
514 | |
---|
515 | // We are done, once we've found our closing tag. |
---|
516 | return; |
---|
517 | } |
---|
518 | else |
---|
519 | { |
---|
520 | // If not a closing tag, id it, and stream. |
---|
521 | const char* tagloc = tag->c_str() + tagIndex; |
---|
522 | TiXmlNode* node = Identify( tagloc ); |
---|
523 | if ( !node ) |
---|
524 | return; |
---|
525 | node->StreamIn( in, tag ); |
---|
526 | delete node; |
---|
527 | node = 0; |
---|
528 | |
---|
529 | // No return: go around from the beginning: text, closing tag, or node. |
---|
530 | } |
---|
531 | } |
---|
532 | } |
---|
533 | } |
---|
534 | #endif |
---|
535 | |
---|
536 | const char* TiXmlElement::Parse( const char* p ) |
---|
537 | { |
---|
538 | p = SkipWhiteSpace( p ); |
---|
539 | TiXmlDocument* document = GetDocument(); |
---|
540 | |
---|
541 | if ( !p || !*p || *p != '<' ) |
---|
542 | { |
---|
543 | if ( document ) document->SetError( TIXML_ERROR_PARSING_ELEMENT ); |
---|
544 | return false; |
---|
545 | } |
---|
546 | |
---|
547 | p = SkipWhiteSpace( p+1 ); |
---|
548 | |
---|
549 | // Read the name. |
---|
550 | p = ReadName( p, &value ); |
---|
551 | if ( !p || !*p ) |
---|
552 | { |
---|
553 | if ( document ) document->SetError( TIXML_ERROR_FAILED_TO_READ_ELEMENT_NAME ); |
---|
554 | return false; |
---|
555 | } |
---|
556 | |
---|
557 | TIXML_STRING endTag ("</"); |
---|
558 | endTag += value; |
---|
559 | endTag += ">"; |
---|
560 | |
---|
561 | // Check for and read attributes. Also look for an empty |
---|
562 | // tag or an end tag. |
---|
563 | while ( p && *p ) |
---|
564 | { |
---|
565 | p = SkipWhiteSpace( p ); |
---|
566 | if ( !p || !*p ) |
---|
567 | { |
---|
568 | if ( document ) document->SetError( TIXML_ERROR_READING_ATTRIBUTES ); |
---|
569 | return 0; |
---|
570 | } |
---|
571 | if ( *p == '/' ) |
---|
572 | { |
---|
573 | ++p; |
---|
574 | // Empty tag. |
---|
575 | if ( *p != '>' ) |
---|
576 | { |
---|
577 | if ( document ) document->SetError( TIXML_ERROR_PARSING_EMPTY ); |
---|
578 | return 0; |
---|
579 | } |
---|
580 | return (p+1); |
---|
581 | } |
---|
582 | else if ( *p == '>' ) |
---|
583 | { |
---|
584 | // Done with attributes (if there were any.) |
---|
585 | // Read the value -- which can include other |
---|
586 | // elements -- read the end tag, and return. |
---|
587 | ++p; |
---|
588 | p = ReadValue( p ); // Note this is an Element method, and will set the error if one happens. |
---|
589 | if ( !p || !*p ) |
---|
590 | return 0; |
---|
591 | |
---|
592 | // We should find the end tag now |
---|
593 | if ( StringEqual( p, endTag.c_str(), false ) ) |
---|
594 | { |
---|
595 | p += endTag.length(); |
---|
596 | return p; |
---|
597 | } |
---|
598 | else |
---|
599 | { |
---|
600 | if ( document ) document->SetError( TIXML_ERROR_READING_END_TAG ); |
---|
601 | return 0; |
---|
602 | } |
---|
603 | } |
---|
604 | else |
---|
605 | { |
---|
606 | // Try to read an element: |
---|
607 | TiXmlAttribute attrib; |
---|
608 | attrib.SetDocument( document ); |
---|
609 | p = attrib.Parse( p ); |
---|
610 | |
---|
611 | if ( !p || !*p ) |
---|
612 | { |
---|
613 | if ( document ) document->SetError( TIXML_ERROR_PARSING_ELEMENT ); |
---|
614 | return 0; |
---|
615 | } |
---|
616 | SetAttribute( attrib.Name(), attrib.Value() ); |
---|
617 | } |
---|
618 | } |
---|
619 | return p; |
---|
620 | } |
---|
621 | |
---|
622 | |
---|
623 | const char* TiXmlElement::ReadValue( const char* p ) |
---|
624 | { |
---|
625 | TiXmlDocument* document = GetDocument(); |
---|
626 | |
---|
627 | // Read in text and elements in any order. |
---|
628 | p = SkipWhiteSpace( p ); |
---|
629 | while ( p && *p ) |
---|
630 | { |
---|
631 | if ( *p != '<' ) |
---|
632 | { |
---|
633 | // Take what we have, make a text element. |
---|
634 | TiXmlText* textNode = new TiXmlText( "" ); |
---|
635 | |
---|
636 | if ( !textNode ) |
---|
637 | { |
---|
638 | if ( document ) document->SetError( TIXML_ERROR_OUT_OF_MEMORY ); |
---|
639 | return 0; |
---|
640 | } |
---|
641 | |
---|
642 | p = textNode->Parse( p ); |
---|
643 | |
---|
644 | if ( !textNode->Blank() ) |
---|
645 | LinkEndChild( textNode ); |
---|
646 | else |
---|
647 | delete textNode; |
---|
648 | } |
---|
649 | else |
---|
650 | { |
---|
651 | // We hit a '<' |
---|
652 | // Have we hit a new element or an end tag? |
---|
653 | if ( StringEqual( p, "</", false ) ) |
---|
654 | { |
---|
655 | return p; |
---|
656 | } |
---|
657 | else |
---|
658 | { |
---|
659 | TiXmlNode* node = Identify( p ); |
---|
660 | if ( node ) |
---|
661 | { |
---|
662 | p = node->Parse( p ); |
---|
663 | LinkEndChild( node ); |
---|
664 | } |
---|
665 | else |
---|
666 | { |
---|
667 | return 0; |
---|
668 | } |
---|
669 | } |
---|
670 | } |
---|
671 | p = SkipWhiteSpace( p ); |
---|
672 | } |
---|
673 | |
---|
674 | if ( !p ) |
---|
675 | { |
---|
676 | if ( document ) document->SetError( TIXML_ERROR_READING_ELEMENT_VALUE ); |
---|
677 | } |
---|
678 | return p; |
---|
679 | } |
---|
680 | |
---|
681 | |
---|
682 | #ifdef TIXML_USE_STL |
---|
683 | void TiXmlUnknown::StreamIn( TIXML_ISTREAM * in, TIXML_STRING * tag ) |
---|
684 | { |
---|
685 | while ( in->good() ) |
---|
686 | { |
---|
687 | int c = in->get(); |
---|
688 | (*tag) += c; |
---|
689 | |
---|
690 | if ( c == '>' ) |
---|
691 | { |
---|
692 | // All is well. |
---|
693 | return; |
---|
694 | } |
---|
695 | } |
---|
696 | } |
---|
697 | #endif |
---|
698 | |
---|
699 | |
---|
700 | const char* TiXmlUnknown::Parse( const char* p ) |
---|
701 | { |
---|
702 | TiXmlDocument* document = GetDocument(); |
---|
703 | p = SkipWhiteSpace( p ); |
---|
704 | if ( !p || !*p || *p != '<' ) |
---|
705 | { |
---|
706 | if ( document ) document->SetError( TIXML_ERROR_PARSING_UNKNOWN ); |
---|
707 | return 0; |
---|
708 | } |
---|
709 | ++p; |
---|
710 | value = ""; |
---|
711 | |
---|
712 | while ( p && *p && *p != '>' ) |
---|
713 | { |
---|
714 | value += *p; |
---|
715 | ++p; |
---|
716 | } |
---|
717 | |
---|
718 | if ( !p ) |
---|
719 | { |
---|
720 | if ( document ) document->SetError( TIXML_ERROR_PARSING_UNKNOWN ); |
---|
721 | } |
---|
722 | if ( *p == '>' ) |
---|
723 | return p+1; |
---|
724 | return p; |
---|
725 | } |
---|
726 | |
---|
727 | #ifdef TIXML_USE_STL |
---|
728 | void TiXmlComment::StreamIn( TIXML_ISTREAM * in, TIXML_STRING * tag ) |
---|
729 | { |
---|
730 | while ( in->good() ) |
---|
731 | { |
---|
732 | int c = in->get(); |
---|
733 | (*tag) += c; |
---|
734 | |
---|
735 | if ( c == '>' |
---|
736 | && tag->at( tag->length() - 2 ) == '-' |
---|
737 | && tag->at( tag->length() - 3 ) == '-' ) |
---|
738 | { |
---|
739 | // All is well. |
---|
740 | return; |
---|
741 | } |
---|
742 | } |
---|
743 | } |
---|
744 | #endif |
---|
745 | |
---|
746 | |
---|
747 | const char* TiXmlComment::Parse( const char* p ) |
---|
748 | { |
---|
749 | TiXmlDocument* document = GetDocument(); |
---|
750 | value = ""; |
---|
751 | |
---|
752 | p = SkipWhiteSpace( p ); |
---|
753 | const char* startTag = "<!--"; |
---|
754 | const char* endTag = "-->"; |
---|
755 | |
---|
756 | if ( !StringEqual( p, startTag, false ) ) |
---|
757 | { |
---|
758 | document->SetError( TIXML_ERROR_PARSING_COMMENT ); |
---|
759 | return 0; |
---|
760 | } |
---|
761 | p += strlen( startTag ); |
---|
762 | p = ReadText( p, &value, false, endTag, false ); |
---|
763 | return p; |
---|
764 | } |
---|
765 | |
---|
766 | |
---|
767 | const char* TiXmlAttribute::Parse( const char* p ) |
---|
768 | { |
---|
769 | p = SkipWhiteSpace( p ); |
---|
770 | if ( !p || !*p ) return 0; |
---|
771 | |
---|
772 | // Read the name, the '=' and the value. |
---|
773 | p = ReadName( p, &name ); |
---|
774 | if ( !p || !*p ) |
---|
775 | { |
---|
776 | if ( document ) document->SetError( TIXML_ERROR_READING_ATTRIBUTES ); |
---|
777 | return 0; |
---|
778 | } |
---|
779 | p = SkipWhiteSpace( p ); |
---|
780 | if ( !p || !*p || *p != '=' ) |
---|
781 | { |
---|
782 | if ( document ) document->SetError( TIXML_ERROR_READING_ATTRIBUTES ); |
---|
783 | return 0; |
---|
784 | } |
---|
785 | |
---|
786 | ++p; // skip '=' |
---|
787 | p = SkipWhiteSpace( p ); |
---|
788 | if ( !p || !*p ) |
---|
789 | { |
---|
790 | if ( document ) document->SetError( TIXML_ERROR_READING_ATTRIBUTES ); |
---|
791 | return 0; |
---|
792 | } |
---|
793 | |
---|
794 | const char* end; |
---|
795 | |
---|
796 | if ( *p == '\'' ) |
---|
797 | { |
---|
798 | ++p; |
---|
799 | end = "\'"; |
---|
800 | p = ReadText( p, &value, false, end, false ); |
---|
801 | } |
---|
802 | else if ( *p == '"' ) |
---|
803 | { |
---|
804 | ++p; |
---|
805 | end = "\""; |
---|
806 | p = ReadText( p, &value, false, end, false ); |
---|
807 | } |
---|
808 | else |
---|
809 | { |
---|
810 | // All attribute values should be in single or double quotes. |
---|
811 | // But this is such a common error that the parser will try |
---|
812 | // its best, even without them. |
---|
813 | value = ""; |
---|
814 | while ( p && *p // existence |
---|
815 | && !isspace( *p ) && *p != '\n' && *p != '\r' // whitespace |
---|
816 | && *p != '/' && *p != '>' ) // tag end |
---|
817 | { |
---|
818 | value += *p; |
---|
819 | ++p; |
---|
820 | } |
---|
821 | } |
---|
822 | return p; |
---|
823 | } |
---|
824 | |
---|
825 | #ifdef TIXML_USE_STL |
---|
826 | void TiXmlText::StreamIn( TIXML_ISTREAM * in, TIXML_STRING * tag ) |
---|
827 | { |
---|
828 | while ( in->good() ) |
---|
829 | { |
---|
830 | int c = in->peek(); |
---|
831 | if ( c == '<' ) |
---|
832 | return; |
---|
833 | |
---|
834 | (*tag) += c; |
---|
835 | in->get(); |
---|
836 | } |
---|
837 | } |
---|
838 | #endif |
---|
839 | |
---|
840 | const char* TiXmlText::Parse( const char* p ) |
---|
841 | { |
---|
842 | value = ""; |
---|
843 | |
---|
844 | //TiXmlDocument* doc = GetDocument(); |
---|
845 | bool ignoreWhite = true; |
---|
846 | // if ( doc && !doc->IgnoreWhiteSpace() ) ignoreWhite = false; |
---|
847 | |
---|
848 | const char* end = "<"; |
---|
849 | p = ReadText( p, &value, ignoreWhite, end, false ); |
---|
850 | if ( p ) |
---|
851 | return p-1; // don't truncate the '<' |
---|
852 | return 0; |
---|
853 | } |
---|
854 | |
---|
855 | #ifdef TIXML_USE_STL |
---|
856 | void TiXmlDeclaration::StreamIn( TIXML_ISTREAM * in, TIXML_STRING * tag ) |
---|
857 | { |
---|
858 | while ( in->good() ) |
---|
859 | { |
---|
860 | int c = in->get(); |
---|
861 | (*tag) += c; |
---|
862 | |
---|
863 | if ( c == '>' ) |
---|
864 | { |
---|
865 | // All is well. |
---|
866 | return; |
---|
867 | } |
---|
868 | } |
---|
869 | } |
---|
870 | #endif |
---|
871 | |
---|
872 | const char* TiXmlDeclaration::Parse( const char* p ) |
---|
873 | { |
---|
874 | p = SkipWhiteSpace( p ); |
---|
875 | // Find the beginning, find the end, and look for |
---|
876 | // the stuff in-between. |
---|
877 | TiXmlDocument* document = GetDocument(); |
---|
878 | if ( !p || !*p || !StringEqual( p, "<?xml", true ) ) |
---|
879 | { |
---|
880 | if ( document ) document->SetError( TIXML_ERROR_PARSING_DECLARATION ); |
---|
881 | return 0; |
---|
882 | } |
---|
883 | |
---|
884 | p += 5; |
---|
885 | // const char* start = p+5; |
---|
886 | // const char* end = strstr( start, "?>" ); |
---|
887 | |
---|
888 | version = ""; |
---|
889 | encoding = ""; |
---|
890 | standalone = ""; |
---|
891 | |
---|
892 | while ( p && *p ) |
---|
893 | { |
---|
894 | if ( *p == '>' ) |
---|
895 | { |
---|
896 | ++p; |
---|
897 | return p; |
---|
898 | } |
---|
899 | |
---|
900 | p = SkipWhiteSpace( p ); |
---|
901 | if ( StringEqual( p, "version", true ) ) |
---|
902 | { |
---|
903 | // p += 7; |
---|
904 | TiXmlAttribute attrib; |
---|
905 | p = attrib.Parse( p ); |
---|
906 | version = attrib.Value(); |
---|
907 | } |
---|
908 | else if ( StringEqual( p, "encoding", true ) ) |
---|
909 | { |
---|
910 | // p += 8; |
---|
911 | TiXmlAttribute attrib; |
---|
912 | p = attrib.Parse( p ); |
---|
913 | encoding = attrib.Value(); |
---|
914 | } |
---|
915 | else if ( StringEqual( p, "standalone", true ) ) |
---|
916 | { |
---|
917 | // p += 10; |
---|
918 | TiXmlAttribute attrib; |
---|
919 | p = attrib.Parse( p ); |
---|
920 | standalone = attrib.Value(); |
---|
921 | } |
---|
922 | else |
---|
923 | { |
---|
924 | // Read over whatever it is. |
---|
925 | while( p && *p && *p != '>' && !isspace( *p ) ) |
---|
926 | ++p; |
---|
927 | } |
---|
928 | } |
---|
929 | return 0; |
---|
930 | } |
---|
931 | |
---|
932 | bool TiXmlText::Blank() const |
---|
933 | { |
---|
934 | for ( unsigned i=0; i<value.length(); i++ ) |
---|
935 | if ( !isspace( value[i] ) ) |
---|
936 | return false; |
---|
937 | return true; |
---|
938 | } |
---|
939 | |
---|