[Linux C]利用libxml2解析xml文件

linux-dash

A beautiful web dashboard for Linux

项目地址：https://gitcode.com/gh_mirrors/li/linux-dash

免费下载资源

kevin_Android_123456

5881人浏览 · 2012-12-27 13:43:15

kevin_Android_123456 · 2012-12-27 13:43:15 发布

[Linux C]利用libxml2解析xml文件

分类： Linux_C 2012-03-09 15:42 382人阅读评论(0) 收藏举报

为了解析xml，可以使用Linux下默认安装的libxml2。

[cpp]view plaincopy 
    
 /* 
     a.c 
     功能：利用libxml2解析xml文件 
 */  
   
 #include <stdio.h>  
 #include <stdlib.h>  
 #include <string.h>  
 #include <unistd.h>  
 #include <libgen.h>  
 #include <libxml/xmlmemory.h>  
 #include <libxml/parser.h>  
 #include <libxml/xpath.h>  
   
 /*
  * Store the full path of the currently running executable in lpOut.
  *
  * The path is obtained by resolving the /proc/self/exe symbolic link.
  * lpOut must be large enough for the result (at most BUFSIZ bytes,
  * terminator included).
  *
  * Returns 0 on success. On failure "." is stored in lpOut and -1 is returned.
  */
 int GetCurFilePath(char *lpOut)
 {
     char chPath[BUFSIZ];

     /*
      * readlink() never appends a terminating NUL, so pass one byte less
      * than the buffer size and terminate the result ourselves.
      */
     ssize_t nLen = readlink("/proc/self/exe", chPath, sizeof(chPath) - 1);
     if (nLen < 0)
     {
         strcpy(lpOut, ".");
         return -1;
     }

     chPath[nLen] = '\0';
     strcpy(lpOut, chPath);
     return 0;
 }
   
 /*
  * Store the directory that contains the running executable in lpOut.
  *
  * lpOut must be large enough for the result (at most BUFSIZ bytes,
  * terminator included).
  *
  * Returns 0 on success. When the executable path cannot be determined,
  * "." is stored in lpOut and -1 is returned.
  */
 int GetCurDir(char *lpOut)
 {
     char chPath[BUFSIZ] = { 0 };

     if (GetCurFilePath(chPath) < 0)
     {
         // Same fallback GetCurFilePath uses, so lpOut is always a valid string.
         strcpy(lpOut, ".");
         return -1;
     }

     /*
      * dirname() may either edit chPath in place or return a pointer to
      * static storage, so the result must be taken from its return value.
      */
     strcpy(lpOut, dirname(chPath));

     return 0;
 }
   
 /*
  * Parse the XML file named docname and return its document pointer.
  *
  * Returns NULL, after printing a message to stderr, when parsing fails.
  */
 xmlDocPtr getdoc(char *docname)
 {
     xmlDocPtr parsed = xmlParseFile(docname);

     if (!parsed)
         fprintf(stderr, "Document not parsed successfully.\n");

     return parsed;
 }
   
 /*
  * Evaluate the XPath expression xpath against the document doc.
  *
  * Returns the result object, which the caller releases with
  * xmlXPathFreeObject(). Returns NULL when the XPath context cannot be
  * created, when evaluation fails, or when the resulting node set is empty.
  */
 xmlXPathObjectPtr getnodeset(xmlDocPtr doc, xmlChar *xpath)
 {
     xmlXPathContextPtr context = xmlXPathNewContext(doc);
     if (context == NULL)
     {
         fprintf(stderr, "Error in xmlXPathNewContext\n");
         return NULL;
     }

     xmlXPathObjectPtr result = xmlXPathEvalExpression(xpath, context);
     xmlXPathFreeContext(context);       // the context is only needed for the evaluation itself
     if (result == NULL)
     {
         fprintf(stderr, "Error in xmlXPathEvalExpression\n");
         return NULL;
     }

     if (xmlXPathNodeSetIsEmpty(result->nodesetval))
     {
         // An empty node set is reported as "no result"; free the object here
         // because the caller only ever receives NULL in this case.
         xmlXPathFreeObject(result);
         printf("No result\n");
         return NULL;
     }

     return result;
 }
   
 // 解析xmlPath路径的结点  
 void testReadXmlDoc(char *filepath, char *xmlPath)  
 {  
     xmlDocPtr doc = getdoc(filepath);  
     if(NULL == doc)  
         return ;  
   
     xmlChar *xpath = (xmlChar*) xmlPath;  
     xmlXPathObjectPtr result = getnodeset(doc, xpath);          // 获取结果集  
     if(result)  
     {  
         xmlNodeSetPtr nodeset = result->nodesetval;  
         xmlChar *name, *value;  
         printf("nodeset->nodeNr = %d\n", nodeset->nodeNr);        // 打印结果集中结点个数  
         for(int i = 0; i < nodeset->nodeNr; i++)  
         {  
             xmlNodePtr cur = nodeset->nodeTab[i];                // products  
             printf("cur->name = %s\n", cur->name);  
             cur = cur->xmlChildrenNode;  
             while(cur)  
             {  
                 if(xmlStrcmp(cur->name, (const xmlChar*) "text"))        // cur->name不为"text"  
                 {  
                     printf("cur->name = %s\t", cur->name);  
                     name = xmlGetProp(cur, (const xmlChar*) "name");    // 获取属性值  
                     value = xmlGetProp(cur, (const xmlChar*) "value");  
                     printf("name = %s, value = %s\n", name, value);  
                     xmlFree(name);  
                     xmlFree(value);  
                 }  
                 cur = cur->next;  
             }  
             printf("\n");  
         }  
         xmlXPathFreeObject(result);  
     }  
     xmlFreeDoc(doc);  
     xmlCleanupParser();  
 }  
   
 /*
  * Locate dprod.xml next to the executable and print the products it lists.
  *
  * Returns EXIT_SUCCESS, or EXIT_FAILURE if the file name cannot be built.
  */
 int main(void)
 {
     // GetCurDir() may write up to BUFSIZ bytes, so the buffers must be at
     // least that large; the previous 100-byte arrays overflowed for long
     // installation paths.
     char curDir[BUFSIZ] = {0};
     char docname[BUFSIZ + sizeof("/dprod.xml")] = {0};

     if (GetCurDir(curDir) < 0)
         strcpy(curDir, ".");            // fall back to the working directory

     int n = snprintf(docname, sizeof(docname), "%s/dprod.xml", curDir);
     if (n < 0 || (size_t) n >= sizeof(docname))
     {
         fprintf(stderr, "Path of dprod.xml is too long.\n");
         return EXIT_FAILURE;
     }

     testReadXmlDoc(docname, "/allproducts/products");

     return EXIT_SUCCESS;
 }

makefile文件：

[python]view plaincopy 
    
 # Build the example program a from a.c, linking against libxml2.
 CC=gcc  
 CFLAGS=  
 BIN=a  
 # Directory passed to -I so that <libxml/...> headers are found.
 INC=/usr/include/libxml2  
   
 # NOTE: with -std=c99 this build prints an implicit-declaration warning for
 # readlink(); the text after the build output explains that -std=gnu99
 # removes it.
 $(BIN): $(BIN).c  
     $(CC) $(CFLAGS) -o $(BIN) $(BIN).c -I$(INC) -lxml2 -std=c99  
   
 # Remove object files and the built binary.
 clean:  
     rm -f *.o $(BIN)  

xml文件(dprod.xml)内容：

[html]view plaincopy 
    
 <?xml version="1.0"?>  
 <allproducts>  
   <products>  
     <product name="name11" value="value11" />  
     <product name="name12" value="value12" />  
     <product name="name13" value="value13" />  
     <product name="name14" value="value14" />  
   </products>  
   <products>  
     <product name="name21" value="value21" />  
     <product name="name22" value="value22" />  
     <product name="name23" value="value23" />  
   </products>  
   <products>  
     <product name="name31" value="value31" />  
     <product name="name32" value="value32" />  
   </products>  
 </allproducts>  

编译运行：

[plain]view plaincopy 
    
 [zcm@tmp #115]$make  
 gcc  -o a a.c -I/usr/include/libxml2 -lxml2 -std=c99  
 a.c: 在函数‘GetCurFilePath’中:  
 a.c:18: 警告：隐式声明函数‘readlink’  
 [zcm@tmp #116]$./a  
 nodeset->nodeNr = 3  
 cur->name = products  
 cur->name = product  name = name11, value = value11  
 cur->name = product  name = name12, value = value12  
 cur->name = product  name = name13, value = value13  
 cur->name = product  name = name14, value = value14  
   
 cur->name = products  
 cur->name = product  name = name21, value = value21  
 cur->name = product  name = name22, value = value22  
 cur->name = product  name = name23, value = value23  
   
 cur->name = products  
 cur->name = product  name = name31, value = value31  
 cur->name = product  name = name32, value = value32  
   
 [zcm@tmp #117]$  

说明：对于编译中出现的“a.c:18: 警告：隐式声明函数‘readlink’”这个警告，一开始实在不能明白。我查了下手册，这个函数在unistd.h中声明，而且我也已经#include了，为什么还会出现这个警告呢？

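后来突然想到，可能是-std=c99的原因：-std=c99要求严格遵循ISO C标准，此时unistd.h不会公开readlink这类POSIX扩展函数的声明，所以编译器把它当作隐式声明的函数。将它改为-std=gnu99后，这个警告就没有了!（保留-std=c99，并在所有#include之前加上 #define _XOPEN_SOURCE 600 也可以。）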

--------------------------------------------------------------------------------------------------------------------------------------------------

修改了xml文件和上面源码中的testReadXmlDoc()后，发现结果相当神奇，看来对libxml2的理解还是比较缺乏。

1. 修改xml文件内容：

[html]view plaincopy 
    
 <?xml version="1.0"?>  
 <allproducts>  
   <products>h1  
     <product name="name11" value="value11" />h2  
     <product name="name12" value="value12" />h3  
     <product name="name13" value="value13" />h4  
     <product name="name14" value="value14" />h5  
   </products>  
   <products>  
     <product name="name21" value="value21" />  
     <product name="name22" value="value22" />  
     <product name="name23" value="value23" />  
   </products>  
   <products>  
     <product name="name31" value="value31" />g1  
     <product name="name32" value="value32" />  
 g2</products>  
 </allproducts>  

2. 修改testReadXmlDoc()

[cpp]view plaincopy 
    
 // 解析xmlPath路径的结点  
 void testReadXmlDoc(char *filepath, char *xmlPath)  
 {  
     xmlDocPtr doc = getdoc(filepath);  
     if(NULL == doc)  
         return ;  
   
     xmlChar *xpath = (xmlChar*) xmlPath;  
     xmlXPathObjectPtr result = getnodeset(doc, xpath);          // 获取结果集  
     if(result)  
     {  
         xmlNodeSetPtr nodeset = result->nodesetval;  
         xmlChar *name, *value;  
         printf("nodeset->nodeNr = %d\n", nodeset->nodeNr);        // 打印结果集中结点个数  
         for(int i = 0; i < nodeset->nodeNr; i++)  
         {  
             xmlNodePtr cur = nodeset->nodeTab[i];                // products  
             printf("cur->name = %s\n", cur->name);  
             cur = cur->xmlChildrenNode;  
             int ctext = 0;  
             while(cur)  
             {  
                 if(xmlStrcmp(cur->name, (const xmlChar*) "text"))        // cur->name不为"text"  
                 {  
                     printf("cur->name = %s\t", cur->name);  
                     name = xmlGetProp(cur, (const xmlChar*) "name");    // 获取属性值  
                     value = xmlGetProp(cur, (const xmlChar*) "value");  
                     printf("name = %s, value = %s\n", name, value);  
                     xmlFree(name);  
                     xmlFree(value);  
                 }  
                 else  
                 {  
                     ctext++;  
                     xmlChar *v = xmlNodeListGetString(doc, cur, 1);  
                     printf("cur->content = [%s], v = [%s]", cur->content, v); // cur->content获取cur的内容  
                     xmlFree(v);  
                 }  
                 cur = cur->next;  
             }  
             printf("ctext = %d\n", ctext);  
             printf("\n");  
         }  
         xmlXPathFreeObject(result);  
     }  
     xmlFreeDoc(doc);  
     xmlCleanupParser();  
 }  

运行结果：

[plain]view plaincopy 
    
 [zcm@tmp #168]$make  
 gcc  -o a a.c -I/usr/include/libxml2 -lxml2 -std=gnu99  
 [zcm@tmp #169]$./a  
 nodeset->nodeNr = 3  
 cur->name = products  
 cur->content = [h1  
     ], v = [h1  
     h2  
     h3  
     h4  
     h5  
   ]cur->name = product   name = name11, value = value11  
 cur->content = [h2  
     ], v = [h2  
     h3  
     h4  
     h5  
   ]cur->name = product   name = name12, value = value12  
 cur->content = [h3  
     ], v = [h3  
     h4  
     h5  
   ]cur->name = product   name = name13, value = value13  
 cur->content = [h4  
     ], v = [h4  
     h5  
   ]cur->name = product   name = name14, value = value14  
 cur->content = [h5  
   ], v = [h5  
   ]ctext = 5  
   
 cur->name = products  
 cur->content = [  
     ], v = [  
       
       
       
   ]cur->name = product   name = name21, value = value21  
 cur->content = [  
     ], v = [  
       
       
   ]cur->name = product   name = name22, value = value22  
 cur->content = [  
     ], v = [  
       
   ]cur->name = product   name = name23, value = value23  
 cur->content = [  
   ], v = [  
   ]ctext = 4  
   
 cur->name = products  
 cur->content = [  
     ], v = [  
     g1  
       
 g2]cur->name = product   name = name31, value = value31  
 cur->content = [g1  
     ], v = [g1  
       
 g2]cur->name = product   name = name32, value = value32  
 cur->content = [  
 g2], v = [  
 g2]ctext = 3  
   
 [zcm@tmp #170]$  

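由此可见：cur->content只是当前文本结点自身的内容；而xmlNodeListGetString(doc, cur, 1)会从cur开始，把它以及后面所有兄弟文本结点的内容拼接在一起（所以上面v的输出越往后越短）。因此一般情况下，要取某一个文本结点的内容时，我们用的比较多的可能会是cur->content这个东西了!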

补充：

在网上看到一个人的写法，可以在解析xml文件时，直接忽略掉结点之间的无效空白。对于本文，就是将：

doc = xmlParseFile(docname);　－－－＞修改为：doc = xmlReadFile(docname, "UTF-8", XML_PARSE_NOBLANKS); // 注意函数要换成xmlReadFile（xmlParseFile只接受文件名这一个参数）；第3个参数是关键

http://blog.csdn.net/joeblackzqq/article/details/7337093

GitHub 加速计划 / li / linux-dash

10.39 K

1.2 K

下载

A beautiful web dashboard for Linux

最近提交(Master分支：2 个月前 )

186a802e added ecosystem file for PM2 4 年前

5def40a3 Add host customization support for the NodeJS version 4 年前

GitCode 开源社区

旨在为数千万中国开发者提供一个无缝且高效的云端环境，以支持学习、使用和贡献开源项目。

更多推荐

[转载]在Windows环境下安装GNU Radio

转自：在Windows环境下安装GNURadio_恐弱智_新浪博客GNU Radio是用Python开发的，大部分开源的工程能够在Linux环境下运行良好，而Windows下却运行的很勉强，而且安装配置都很复杂。GNU Radio算是个例外了，不光提供了Windows的二进制安装，还有比较详细的说明。我是Python小白，所以折腾了好久才弄好，特意记录下来，免得以后再装还折腾。GNU Radio的

GitCode 开源社区

centOS 8 使用dnf安装Docker

DNF是什么？CentOS 8使用YUM软件包管理器版本v4.0.4。现在，该版本使用DNF(已删除YUM)。DNF是软件包管理器。它会在Linux发行版上安装，执行更新并删除软件包。使用DNF安装Docker跳过具有损坏依赖性的程序包一个有效的解决方案是使您的CentOS 8系统使用以下--nobest命令安装最符合条件的版本：sudo dnf install docker...

GitCode 开源社区

定时同步数据库表(mysql+linux+crontab)

sync.sh里面的参数需要改变，ip/username/password/database/tablesync.sh#!/bin/sh# Please change the IP and password of the data source db.# Then change the table name.filename=/home/nington/db/$(date +%Y-%m