libxml:从 xmlTextReaderPtr 构建 DOM 树,处理命名空间
我正在尝试从 DOM 树 /xmlsoft.org/html/libxml-xmlreader.html" rel="nofollow">xmlTextReaderPtr。在我的最终程序中,它将用于使用大型 XML 文件中的 xslt 处理小型 DOM 树,例如
#include <stdio.h>
#include <libxml/parser.h>
#include <libxml/tree.h>
#include <libxml/xmlreader.h>
/* dump XML node */
static void print_element_names(xmlNode * a_node)
{
xmlNode *cur_node = NULL;
for (cur_node = a_node; cur_node; cur_node = xmlNextElementSibling(cur_node))
{
if (cur_node->type == XML_ELEMENT_NODE)
{
xmlAttrPtr attr;
printf("node type: Element, name: %s", cur_node->name);
if(cur_node->ns!=0 && cur_node->ns->href!=0) printf(" with namespace: %s", cur_node->ns->href);
printf("\n");
for(attr = cur_node->properties; NULL != attr; attr = attr->next)
{
xmlChar* v=xmlGetProp( cur_node,attr->name);
printf(" @%s=%s ", attr->name,v);
xmlFree(v);
}
}
print_element_names(cur_node->children);
}
}
int main(int argc,char** argv)
{
LIBXML_TEST_VERSION;
xmlTextReaderPtr reader;
xmlDocPtr doc = NULL;
xmlNodePtr current=NULL;
xmlNsPtr ns=NULL;
/* read from stdin */
reader=xmlReaderForFd(fileno(stdin),0,"UTF-8",0);
for(;;)
{
int nodeType;
int ret = xmlTextReaderRead(reader);
if(ret<=0) break;
nodeType=xmlTextReaderNodeType(reader);
switch(nodeType)
{
case XML_READER_TYPE_ELEMENT:
{
xmlNsPtr ns=0;
xmlNodePtr node;
if(doc==NULL)
{
doc=xmlNewDoc( BAD_CAST "1.0");
}
if(xmlTextReaderConstNamespaceUri(reader)!=0)
{
/** how should I handle the attributes' namespaces & prefix here ? */
xmlNsPtr ns=xmlSearchNs(doc,current,xmlTextReaderConstNamespaceUri(reader));
node=xmlNewNode(ns, xmlTextReaderConstName(reader));
if(ns==0)
{
ns=xmlNewNs(node,
xmlTextReaderConstPrefix(reader),
xmlTextReaderConstNamespaceUri(reader)
);
}
}
else
{
node=xmlNewNode(0, xmlTextReaderConstName(reader));
}
if(current==NULL)
{
xmlDocSetRootElement(doc,node);
}
else
{
xmlAddChild(current,node);
}
current=node;
if(xmlTextReaderIsEmptyElement(reader))
{
current= current->parent;
}
if(xmlTextReaderHasAttributes(reader))
{
int i;
int n_att=xmlTextReaderAttributeCount(reader);
for(i=0;i< n_att;++i)
{
const xmlChar* k;
xmlChar* v;
xmlTextReaderMoveToAttributeNo(reader,i);
k = xmlTextReaderConstName(reader);
v = xmlTextReaderValue(reader);
/** how should I handle the attributes' namespaces & prefix here ? */
xmlNewProp(node,k, v);
xmlFree(v);
}
xmlTextReaderMoveToElement(reader);
}
break;
}
case XML_READER_TYPE_END_ELEMENT:
{
current= current->parent;
break;
}
case XML_READER_TYPE_SIGNIFICANT_WHITESPACE:
case XML_READER_TYPE_TEXT:
{
const xmlChar* v = xmlTextReaderConstValue(reader);
xmlNodePtr node= xmlNewDocText(doc,v);
xmlAddChild(current,node);
break;
}
default:
{
fprintf(stderr,"Ignoring node Type %d\n",nodeType);
break;
}
}
}
if(doc!=NULL)
{
print_element_names(xmlDocGetRootElement(doc));
xmlDocDump(stderr,doc);
xmlFreeDoc(doc);
}
xmlFreeTextReader(reader);
xmlCleanupParser();
xmlMemoryDump();
return 0;
}
这是我的测试文件:
<?xml version="1.0"?>
<a xmlns="http://urn1.org" xmlns:ns1="http://urn2.org" ns1:test="ok">azdazd
<b xmlns:ns2="http://urn3.org" xmlns:ns3="http://urn4.org" ns3:test="OK"/>
azd
<ns1:b test="ok"/>
xaz
</a>
非常感谢,
如果你对这篇内容有疑问,欢迎到本站社区发帖提问 参与讨论,获取更多帮助,或者扫码二维码加入 Web 技术交流群。
绑定邮箱获取回复消息
由于您还没有绑定你的真实邮箱,如果其他用户或者作者回复了您的评论,将不能在第一时间通知您!
发布评论
评论(1)
好的,我已经找到了我的错误以及如何使用 API。这是代码:
Ok, I've found my erros and how to use the API. Here is the code: