libxml是一個實現了讀,建立和操做xml數據等功能的c語言庫,對於其具體的API,可參考官方文檔,這裏只介紹一些經常使用的用法。
node
libxml在操做xml數據時,定義了幾種節點類型:測試
Enum xmlElementType { XML_ELEMENT_NODE = 1 XML_ATTRIBUTE_NODE = 2 XML_TEXT_NODE = 3 XML_CDATA_SECTION_NODE = 4 XML_ENTITY_REF_NODE = 5 XML_ENTITY_NODE = 6 XML_PI_NODE = 7 XML_COMMENT_NODE = 8 XML_DOCUMENT_NODE = 9 XML_DOCUMENT_TYPE_NODE = 10 XML_DOCUMENT_FRAG_NODE = 11 XML_NOTATION_NODE = 12 XML_HTML_DOCUMENT_NODE = 13 XML_DTD_NODE = 14 XML_ELEMENT_DECL = 15 XML_ATTRIBUTE_DECL = 16 XML_ENTITY_DECL = 17 XML_NAMESPACE_DECL = 18 XML_XINCLUDE_START = 19 XML_XINCLUDE_END = 20 XML_DOCB_DOCUMENT_NODE = 21 }
比較經常使用的是XML_ELEMENT_NODE,XML_TEXT_NODE和XML_ATTRIBUTE_NODE,可稱爲元素節點,文本節點和屬性節點;它們都是xmlNode結構體類型的,且能夠經過curnode->type來得到類型。這幾種節點分別對應xml的不一樣數據,如下面xml文檔來講明,story和storyinfo是元素節點,而John Fleck就是文本節點。在結構上John Fleck文本節點是<author>元素節點的子節點。spa
測試xml:code
<?xml version="1.0"?> <story> <storyinfo> <author>John Fleck</author> <datewritten>June 2, 2002</datewritten> <keyword>example keyword</keyword> </storyinfo> <body> <headline>This is the headline</headline> <para>This is the body text.</para> </body> </story>
1. 解析文檔:orm
xmlDocPtr doc; xmlNodePtr cur; doc = xmlParseFile(docname); if (doc == NULL ) { fprintf(stderr,"Document not parsed successfully. \n"); return; } cur = xmlDocGetRootElement(doc); if (cur == NULL) { fprintf(stderr,"empty document\n"); xmlFreeDoc(doc); return; } if (xmlStrcmp(cur->name, (const xmlChar *) "story")) { fprintf(stderr,"document of the wrong type, root node != story"); xmlFreeDoc(doc); return; }
2. 檢索節點:xml
void parseStory (xmlDocPtr doc, xmlNodePtr cur) { xmlChar *key; cur = cur->xmlChildrenNode; while (cur != NULL) { if ((!xmlStrcmp(cur->name, (const xmlChar *)"keyword"))) { key = xmlNodeListGetString(doc, cur->xmlChildrenNode, 1); printf("keyword: %s\n", key); xmlFree(key); } cur = cur->next; } return; }
3. XPATH方式檢索文檔:
除了遍歷文檔樹來尋找某個節點外,libxml2還支持使用XPATH表達式來尋找符合指定搜索規則的節點集。xpath的內容可參見:http://www.w3schools.com/xpath/xpath_operators.asp 和 http://www.w3.org/TR/xpath/ 。測試可參:http://www.xpathtester.com/test 。這裏是幾個簡單的用法,"/Infomation/CameraSet"取的是絕對路徑,"//CameraItem"取的是相對路徑,數字可直接用等號比較,文本則要用text()取其內容進行比較。文檔
char expr[128]; sprintf(expr, "/Information/CameraSet/CameraItem[IP[text()='%s']]", pItem->sIP); sprintf(expr, "/Information/CameraSet/CameraItem[Index=%d]/VarTrafficLine", iIndex); xpObjPtr = getnodeset(doc, (xmlChar*)expr);
4. 添加節點和獲取文本:
設置元素節點的文本可以使用xmlNodeSetContent(cur, (const xmlChar*)"sssss");也有其餘方式,以下面代碼中。獲取文本:xmlNodeGetContent(cur)和xmlNodeListGetString(doc, nodelist, inline);第一個方法獲取的是cur的子孫節點中類型是TEXT或者ENTITY_REF的節點的內容拼接的字符串;第二個方法只取當前節點鏈表中類型是TEXT或者ENTITY_REF的節點的內容。字符串
newnode = xmlNewNode(NULL, (const xmlChar*)"NewNode"); xmlAddChild(cur, newnode); xmlNewTextChild(newnode, NULL, (const xmlChar*)"Code", (const xmlChar*)"1001"); xmlNewTextChild(newnode, NULL, (const xmlChar*)"Name", (const xmlChar*)"anewnode"); textnode = xmlNewText((const xmlChar*)"abcdefg"); //向已存在的元素節點添加文本 xmlAddChild(cur, textnode);
5. 刪除節點:get
xmlUnlinkNode(cur); xmlFreeNode(cur);
這樣刪除指定節點後,會自動造成新的節點樹結構,而不會打亂原來的結構,如:刪除<author>節點後,<storyinfo>的第一個子節點就變成<datewritten>,<datewritten>的前驅節點是NULL,而不是刪除前的<author>了。it
代碼:
#include <libxml/parser.h> #include <libxml/xpath.h> xmlDocPtr getdoc (char *docname) { xmlDocPtr doc; doc = xmlParseFile(docname); if (doc == NULL ) { fprintf(stderr,"Document not parsed successfully. \n"); return NULL; } return doc; } xmlXPathObjectPtr getnodeset (xmlDocPtr doc, xmlChar *xpath){ xmlXPathContextPtr context; xmlXPathObjectPtr result; context = xmlXPathNewContext(doc); if (context == NULL) { printf("Error in xmlXPathNewContext\n"); return NULL; } result = xmlXPathEvalExpression(xpath, context); xmlXPathFreeContext(context); if (result == NULL) { printf("Error in xmlXPathEvalExpression\n"); return NULL; } if(xmlXPathNodeSetIsEmpty(result->nodesetval)){ xmlXPathFreeObject(result); printf("No result\n"); return NULL; } return result; } int main(int argc, char **argv) { char *docname; xmlDocPtr doc; xmlChar *xpath = (xmlChar*) "//root"; xmlNodeSetPtr nodeset; xmlXPathObjectPtr result; int i; xmlChar *keyword; if (argc <= 1) { printf("Usage: %s docname\n", argv[0]); return(0); } docname = argv[1]; doc = getdoc(docname); result = getnodeset (doc, xpath); if (result) { nodeset = result->nodesetval; for (i=0; i < nodeset->nodeNr; i++) { keyword = xmlNodeListGetString(doc, nodeset->nodeTab[i]->xmlChildrenNode,1); printf("keyword1: %s\n", keyword); xmlFree(keyword); } xmlXPathFreeObject (result); } xmlFreeDoc(doc); xmlCleanupParser(); return (1); }