///////////////////////////////////////////////////////////////////////////// // Name: xml/xml.h // Purpose: interface of wxXmlNode, wxXmlAttribute, wxXmlDocument // Author: wxWidgets team // Licence: wxWindows licence ///////////////////////////////////////////////////////////////////////////// /// Represents XML node type. enum wxXmlNodeType { // note: values are synchronized with xmlElementType from libxml wxXML_ELEMENT_NODE = 1, wxXML_ATTRIBUTE_NODE = 2, wxXML_TEXT_NODE = 3, wxXML_CDATA_SECTION_NODE = 4, wxXML_ENTITY_REF_NODE = 5, wxXML_ENTITY_NODE = 6, wxXML_PI_NODE = 7, wxXML_COMMENT_NODE = 8, wxXML_DOCUMENT_NODE = 9, wxXML_DOCUMENT_TYPE_NODE = 10, wxXML_DOCUMENT_FRAG_NODE = 11, wxXML_NOTATION_NODE = 12, wxXML_HTML_DOCUMENT_NODE = 13 }; /** @class wxXmlNode Represents a node in an XML document. See wxXmlDocument. Node has a name and may have content and attributes. Most common node types are @c wxXML_TEXT_NODE (name and attributes are irrelevant) and @c wxXML_ELEMENT_NODE. Example: in \hi\ there is an element with the name @c title and irrelevant content and one child of type @c wxXML_TEXT_NODE with @c hi as content. The @c wxXML_PI_NODE type sets the name to the PI target and the contents to the instructions. Note that whilst the PI instructions are often in the form of pseudo-attributes these do not use the nodes attribute system. It is the users responsibility to code and decode the instruction text. If @c wxUSE_UNICODE is 0, all strings are encoded in the encoding given to wxXmlDocument::Load (default is UTF-8). @library{wxxml} @category{xml} @see wxXmlDocument, wxXmlAttribute */ class wxXmlNode { public: /** Creates this XML node and eventually insert it into an existing XML tree. @param parent The parent node to which append this node instance. If this argument is @NULL this new node will be floating and it can be appended later to another one using the AddChild() or InsertChild() functions. Otherwise the child is already added to the XML tree by this constructor and it shouldn't be done again. @param type One of the ::wxXmlNodeType enumeration value. @param name The name of the node. This is the string which appears between angular brackets. @param content The content of the node. Only meaningful when type is @c wxXML_TEXT_NODE or @c wxXML_CDATA_SECTION_NODE. @param attrs If not @NULL, this wxXmlAttribute object and its eventual siblings are attached to the node. @param next If not @NULL, this node and its eventual siblings are attached to the node. @param lineNo Number of line this node was present at in input file or -1. */ wxXmlNode(wxXmlNode* parent, wxXmlNodeType type, const wxString& name, const wxString& content = wxEmptyString, wxXmlAttribute* attrs = NULL, wxXmlNode* next = NULL, int lineNo = -1); /** A simplified version of the first constructor form, assuming a @NULL parent. @param type One of the ::wxXmlNodeType enumeration value. @param name The name of the node. This is the string which appears between angular brackets. @param content The content of the node. Only meaningful when type is @c wxXML_TEXT_NODE or @c wxXML_CDATA_SECTION_NODE. @param lineNo Number of line this node was present at in input file or -1. */ wxXmlNode(wxXmlNodeType type, const wxString& name, const wxString& content = wxEmptyString, int lineNo = -1); /** Copy constructor. Note that this does NOT copy siblings and parent pointer, i.e. GetParent() and GetNext() will return @NULL after using copy ctor and are never unmodified by operator=(). On the other hand, it DOES copy children and attributes. */ wxXmlNode(const wxXmlNode& node); /** The virtual destructor. Deletes attached children and attributes. */ virtual ~wxXmlNode(); /** Appends a attribute with given @a name and @a value to the list of attributes for this node. */ virtual void AddAttribute(const wxString& name, const wxString& value); /** Appends given attribute to the list of attributes for this node. */ virtual void AddAttribute(wxXmlAttribute* attr); /** Adds node @a child as the last child of this node. @note Note that this function works in O(n) time where @e n is the number of existing children. Consequently, adding large number of child nodes using this method can be expensive, because it has O(n^2) time complexity in number of nodes to be added. Use InsertChildAfter() to populate XML tree in linear time. @see InsertChild(), InsertChildAfter() */ virtual void AddChild(wxXmlNode* child); /** Removes the first attributes which has the given @a name from the list of attributes for this node. */ virtual bool DeleteAttribute(const wxString& name); /** Returns true if a attribute named attrName could be found. The value of that attribute is saved in value (which must not be @NULL). */ bool GetAttribute(const wxString& attrName, wxString* value) const; /** Returns the value of the attribute named @a attrName if it does exist. If it does not exist, the @a defaultVal is returned. */ wxString GetAttribute(const wxString& attrName, const wxString& defaultVal = wxEmptyString) const; /** Return a pointer to the first attribute of this node. */ wxXmlAttribute* GetAttributes() const; /** Returns the first child of this node. To get a pointer to the second child of this node (if it does exist), use the GetNext() function on the returned value. */ wxXmlNode* GetChildren() const; /** Returns the content of this node. Can be an empty string. Be aware that for nodes of type @c wxXML_ELEMENT_NODE (the most used node type) the content is an empty string. See GetNodeContent() for more details. */ const wxString& GetContent() const; /** Returns the number of nodes which separate this node from @c grandparent. This function searches only the parents of this node until it finds @a grandparent or the @NULL node (which is the parent of non-linked nodes or the parent of a wxXmlDocument's root element node). */ int GetDepth(wxXmlNode* grandparent = NULL) const; /** Returns a flag indicating whether encoding conversion is necessary when saving. The default is @false. You can improve saving efficiency considerably by setting this value. */ bool GetNoConversion() const; /** Returns line number of the node in the input XML file or @c -1 if it is unknown. */ int GetLineNumber() const; /** Returns the name of this node. Can be an empty string (e.g. for nodes of type @c wxXML_TEXT_NODE or @c wxXML_CDATA_SECTION_NODE). */ const wxString& GetName() const; /** Returns a pointer to the sibling of this node or @NULL if there are no siblings. */ wxXmlNode* GetNext() const; /** Returns the content of the first child node of type @c wxXML_TEXT_NODE or @c wxXML_CDATA_SECTION_NODE. This function is very useful since the XML snippet @c "tagnametagcontent/tagname" is represented by expat with the following tag tree: @code wxXML_ELEMENT_NODE name="tagname", content="" |-- wxXML_TEXT_NODE name="", content="tagcontent" @endcode or eventually: @code wxXML_ELEMENT_NODE name="tagname", content="" |-- wxXML_CDATA_SECTION_NODE name="", content="tagcontent" @endcode An empty string is returned if the node has no children of type @c wxXML_TEXT_NODE or @c wxXML_CDATA_SECTION_NODE, or if the content of the first child of such types is empty. */ wxString GetNodeContent() const; /** Returns a pointer to the parent of this node or @NULL if this node has no parent. */ wxXmlNode* GetParent() const; /** Returns the type of this node. */ wxXmlNodeType GetType() const; /** Returns @true if this node has a attribute named @a attrName. */ bool HasAttribute(const wxString& attrName) const; /** Inserts the @a child node immediately before @a followingNode in the children list. @return @true if @a followingNode has been found and the @a child node has been inserted. @note For historical reasons, @a followingNode may be @NULL. In that case, then @a child is prepended to the list of children and becomes the first child of this node, i.e. it behaves identically to using the first children (as returned by GetChildren()) for @a followingNode). @see AddChild(), InsertChildAfter() */ virtual bool InsertChild(wxXmlNode* child, wxXmlNode* followingNode); /** Inserts the @a child node immediately after @a precedingNode in the children list. @return @true if @a precedingNode has been found and the @a child node has been inserted. @param child The child to insert. @param precedingNode The node to insert @a child after. As a special case, this can be @NULL if this node has no children yet -- in that case, @a child will become this node's only child node. @since 2.8.8 @see InsertChild(), AddChild() */ virtual bool InsertChildAfter(wxXmlNode* child, wxXmlNode* precedingNode); /** Returns @true if the content of this node is a string containing only whitespaces (spaces, tabs, new lines, etc). Note that this function is locale-independent since the parsing of XML documents must always produce the exact same tree regardless of the locale it runs under. */ bool IsWhitespaceOnly() const; /** Removes the given node from the children list. Returns @true if the node was found and removed or @false if the node could not be found. Note that the caller is responsible for deleting the removed node in order to avoid memory leaks. */ virtual bool RemoveChild(wxXmlNode* child); /** Sets as first attribute the given wxXmlAttribute object. The caller is responsible for deleting any previously present attributes attached to this node. */ void SetAttributes(wxXmlAttribute* attr); /** Sets as first child the given node. The caller is responsible for deleting any previously present children node. */ void SetChildren(wxXmlNode* child); /** Sets the content of this node. */ void SetContent(const wxString& con); /** Sets the name of this node. */ void SetName(const wxString& name); /** Sets as sibling the given node. The caller is responsible for deleting any previously present sibling node. */ void SetNext(wxXmlNode* next); /** Sets a flag to indicate whether encoding conversion is necessary when saving. The default is @false. You can improve saving efficiency considerably by setting this value. */ void SetNoConversion(bool noconversion); /** Sets as parent the given node. The caller is responsible for deleting any previously present parent node. */ void SetParent(wxXmlNode* parent); /** Sets the type of this node. */ void SetType(wxXmlNodeType type); /** See the copy constructor for more info. */ wxXmlNode& operator=(const wxXmlNode& node); }; /** @class wxXmlAttribute Represents a node attribute. Example: in \, @c src is an attribute with value @c hello.gif and @c id is an attribute with value @c 3. @library{wxxml} @category{xml} @see wxXmlDocument, wxXmlNode */ class wxXmlAttribute { public: /** Default constructor. */ wxXmlAttribute(); /** Creates the attribute with given @a name and @a value. If @a next is not @NULL, then sets it as sibling of this attribute. */ wxXmlAttribute(const wxString& name, const wxString& value, wxXmlAttribute* next = NULL); /** The virtual destructor. */ virtual ~wxXmlAttribute(); /** Returns the name of this attribute. */ wxString GetName() const; /** Returns the sibling of this attribute or @NULL if there are no siblings. */ wxXmlAttribute* GetNext() const; /** Returns the value of this attribute. */ wxString GetValue() const; /** Sets the name of this attribute. */ void SetName(const wxString& name); /** Sets the sibling of this attribute. */ void SetNext(wxXmlAttribute* next); /** Sets the value of this attribute. */ void SetValue(const wxString& value); }; //* special indentation value for wxXmlDocument::Save #define wxXML_NO_INDENTATION (-1) //* flags for wxXmlDocument::Load enum wxXmlDocumentLoadFlag { wxXMLDOC_NONE, wxXMLDOC_KEEP_WHITESPACE_NODES }; /** @class wxXmlDocument This class holds XML data/document as parsed by XML parser in the root node. wxXmlDocument internally uses the expat library which comes with wxWidgets to parse the given stream. A simple example of using XML classes is: @code wxXmlDocument doc; if (!doc.Load("myfile.xml")) return false; // start processing the XML file if (doc.GetRoot()->GetName() != "myroot-node") return false; // examine prologue wxXmlNode *prolog = doc.GetDocumentNode()->GetChildren(); while (prolog) { if (prolog->GetType() == wxXML_PI_NODE && prolog->GetName() == "target") { // process Process Instruction contents wxString pi = prolog->GetContent(); ... } } wxXmlNode *child = doc.GetRoot()->GetChildren(); while (child) { if (child->GetName() == "tag1") { // process text enclosed by tag1/tag1 wxString content = child->GetNodeContent(); ... // process attributes of tag1 wxString attrvalue1 = child->GetAttribute("attr1", "default-value"); wxString attrvalue2 = child->GetAttribute("attr2", "default-value"); ... } else if (child->GetName() == "tag2") { // process tag2 ... } child = child->GetNext(); } @endcode Note that if you want to preserve the original formatting of the loaded file including whitespaces and indentation, you need to turn off whitespace-only textnode removal and automatic indentation: @code wxXmlDocument doc; doc.Load("myfile.xml", "UTF-8", wxXMLDOC_KEEP_WHITESPACE_NODES); // myfile2.xml will be identical to myfile.xml saving it this way: doc.Save("myfile2.xml", wxXML_NO_INDENTATION); @endcode Using default parameters, you will get a reformatted document which in general is different from the original loaded content: @code wxXmlDocument doc; doc.Load("myfile.xml"); doc.Save("myfile2.xml"); // myfile2.xml != myfile.xml @endcode @library{wxxml} @category{xml} @see wxXmlNode, wxXmlAttribute */ class wxXmlDocument : public wxObject { public: /** Default constructor. */ wxXmlDocument(); /** Copy constructor. Deep copies all the XML tree of the given document. */ wxXmlDocument(const wxXmlDocument& doc); /** Loads the given filename using the given encoding. See Load(). */ wxXmlDocument(const wxString& filename, const wxString& encoding = "UTF-8")); /** Loads the XML document from given stream using the given encoding. See Load(). */ wxXmlDocument(wxInputStream& stream, const wxString& encoding = "UTF-8"); /** Virtual destructor. Frees the document root node. */ virtual ~wxXmlDocument(); /** Appends a Process Instruction or Comment node to the document prologue. Calling this function will create a prologue or attach the node to the end of an existing prologue. @since 2.9.2 */ void AppendToProlog(wxXmlNode* node); /** Detaches the document node and returns it. The document node will be set to @NULL and thus IsOk() will return @false after calling this function. Note that the caller is responsible for deleting the returned node in order to avoid memory leaks. @since 2.9.2 */ wxXmlNode* DetachDocumentNode(); /** Detaches the root entity node and returns it. After calling this function, the document node will remain together with any prologue nodes, but IsOk() will return @false since the root entity will be missing. Note that the caller is responsible for deleting the returned node in order to avoid memory leaks. */ wxXmlNode* DetachRoot(); /** Returns encoding of in-memory representation of the document (same as passed to Load() or constructor, defaults to UTF-8). @note this is meaningless in Unicode build where data are stored as @c wchar_t*. */ wxString GetEncoding() const; /** Returns encoding of document (may be empty). @note This is the encoding original file was saved in, @b not the encoding of in-memory representation! */ const wxString& GetFileEncoding() const; /** Returns the document node of the document. @since 2.9.2 */ wxXmlNode* GetDocumentNode() const; /** Returns the root element node of the document. */ wxXmlNode* GetRoot() const; /** Returns the version of document. This is the value in the @c \ header of the XML document. If the version attribute was not explicitly given in the header, this function returns an empty string. */ const wxString& GetVersion() const; /** Returns @true if the document has been loaded successfully. */ bool IsOk() const; /** Parses @a filename as an xml document and loads its data. If @a flags does not contain wxXMLDOC_KEEP_WHITESPACE_NODES, then, while loading, all nodes of type @c wxXML_TEXT_NODE (see wxXmlNode) are automatically skipped if they contain whitespaces only. The removal of these nodes makes the load process slightly faster and requires less memory however makes impossible to recreate exactly the loaded text with a Save() call later. Read the initial description of this class for more info. Returns true on success, false otherwise. */ virtual bool Load(const wxString& filename, const wxString& encoding = "UTF-8", int flags = wxXMLDOC_NONE); /** Like Load(const wxString&, const wxString&, int) but takes the data from given input stream. */ virtual bool Load(wxInputStream& stream, const wxString& encoding = "UTF-8", int flags = wxXMLDOC_NONE); /** Saves XML tree creating a file named with given string. If @a indentstep is greater than or equal to zero, then, while saving, an automatic indentation is added with steps composed by indentstep spaces. If @a indentstep is @c wxXML_NO_INDENTATION, then, automatic indentation is turned off. */ virtual bool Save(const wxString& filename, int indentstep = 2) const; /** Saves XML tree in the given output stream. See Save(const wxString&, int) for a description of @a indentstep. */ virtual bool Save(wxOutputStream& stream, int indentstep = 2) const; /** Sets the document node of this document. Deletes any previous document node. Use DetachDocumentNode() and then SetDocumentNode() if you want to replace the document node without deleting the old document tree. @since 2.9.2 */ void SetDocumentNode(wxXmlNode* node); /** Sets the encoding of the document. */ void SetEncoding(const wxString& enc); /** Sets the enconding of the file which will be used to save the document. */ void SetFileEncoding(const wxString& encoding); /** Sets the root element node of this document. Will create the document node if necessary. Any previous root element node is deleted. */ void SetRoot(wxXmlNode* node); /** Sets the version of the XML file which will be used to save the document. */ void SetVersion(const wxString& version); /** Deep copies the given document. */ wxXmlDocument& operator=(const wxXmlDocument& doc); /** Get expat library version information. @since 2.9.2 @see wxVersionInfo */ static wxVersionInfo GetLibraryVersionInfo(); };