tinyxml2

FORK: TinyXML2 is a simple, small, efficient, C++ XML parser that can be easily integrated into other programs.
git clone https://git.neptards.moe/neptards/tinyxml2.git
Log | Files | Refs

html5-printer.cpp (3703B)


      1 //  g++ -Wall -O2 contrib/html5-printer.cpp -o html5-printer -ltinyxml2
      2 
      3 //  This program demonstrates how to use "tinyxml2" to generate conformant HTML5
      4 //  by deriving from the "tinyxml2::XMLPrinter" class.
      5 
      6 //  http://dev.w3.org/html5/markup/syntax.html
      7 
      8 //  In HTML5, there are 16 so-called "void" elements.  "void elements" NEVER have
      9 //  inner content (but they MAY have attributes), and are assumed to be self-closing.
     10 //  An example of a self-closig HTML5 element is "<br/>" (line break)
     11 //  All other elements are called "non-void" and MUST never self-close.
     12 //  Examples: "<div class='lolcats'></div>".
     13 
     14 //  tinyxml2::XMLPrinter will emit _ALL_ XML elements with no inner content as
     15 //  self-closing.  This behavior produces space-effeceint XML, but incorrect HTML5.
     16 
     17 //  Author: Dennis Jenkins,  dennis (dot) jenkins (dot) 75 (at) gmail (dot) com.
     18 //  License: Same as tinyxml2 (zlib, see below)
     19 //  This example is a small contribution to the world!  Enjoy it!
     20 
     21 /*
     22 This software is provided 'as-is', without any express or implied
     23 warranty. In no event will the authors be held liable for any
     24 damages arising from the use of this software.
     25 
     26 Permission is granted to anyone to use this software for any
     27 purpose, including commercial applications, and to alter it and
     28 redistribute it freely, subject to the following restrictions:
     29 
     30 1. The origin of this software must not be misrepresented; you must
     31 not claim that you wrote the original software. If you use this
     32 software in a product, an acknowledgment in the product documentation
     33 would be appreciated but is not required.
     34 
     35 2. Altered source versions must be plainly marked as such, and
     36 must not be misrepresented as being the original software.
     37 
     38 3. This notice may not be removed or altered from any source
     39 distribution.
     40 */
     41 
     42 
     43 #include "../tinyxml2.h"
     44 #include <iostream>
     45 
     46 #if defined (_MSC_VER)
     47 #define strcasecmp stricmp
     48 #endif
     49 
     50 using namespace tinyxml2;
     51 
     52 // Contrived input containing a mix of void and non-void HTML5 elements.
     53 // When printed via XMLPrinter, some non-void elements will self-close (not valid HTML5).
     54 static const char input[] =
     55 "<html><body><p style='a'></p><br/>&copy;<col a='1' b='2'/><div a='1'></div></body></html>";
     56 
     57 // XMLPrinterHTML5 is small enough, just put the entire implementation inline.
     58 class	XMLPrinterHTML5 : public XMLPrinter
     59 {
     60 public:
     61     XMLPrinterHTML5 (FILE* file=0, bool compact = false, int depth = 0) :
     62         XMLPrinter (file, compact, depth)
     63     {}
     64 
     65 protected:
     66     virtual void CloseElement () {
     67         if (_elementJustOpened && !isVoidElement (_stack.PeekTop())) {
     68             SealElementIfJustOpened();
     69             }
     70         XMLPrinter::CloseElement();
     71     }
     72 
     73     virtual bool isVoidElement (const char *name) {
     74 // Complete list of all HTML5 "void elements",
     75 // http://dev.w3.org/html5/markup/syntax.html
     76         static const char *list[] = {
     77             "area", "base", "br", "col", "command", "embed", "hr", "img",
     78             "input", "keygen", "link", "meta", "param", "source", "track", "wbr",
     79             NULL
     80         };
     81 
     82 // I could use 'bsearch', but I don't have MSVC to test on (it would work with gcc/libc).
     83         for (const char **p = list; *p; ++p) {
     84             if (!strcasecmp (name, *p)) {
     85                 return true;
     86             }
     87         }
     88 
     89         return false;
     90     }
     91 };
     92 
     93 int	main (void) {
     94     XMLDocument doc (false);
     95     doc.Parse (input);
     96 
     97     std::cout << "INPUT:\n" << input << "\n\n";
     98 
     99     XMLPrinter prn (NULL, true);
    100     doc.Print (&prn);
    101     std::cout << "XMLPrinter (not valid HTML5):\n" << prn.CStr() << "\n\n";
    102 
    103     XMLPrinterHTML5 html5 (NULL, true);
    104     doc.Print (&html5);
    105     std::cout << "XMLPrinterHTML5:\n" << html5.CStr() << "\n";
    106 
    107     return 0;
    108 }