0

快速提问:

如果我有这样的 XML:

<?xml version="1.0" encoding="utf-8"?>
<cop xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:noNamespaceSchemaLocation="cop.xsd">
    <auth>
        <uid mioattributo="20">16<![CDATA[
function matchwo(a,b) ]]></uid>
    </auth>
</cop>

所以uid有两个孩子吧?之一Node.CDATA_SECTION_NODE和之一Node.TEXT_NODE

实现这个快速类(扩展通常的 DefaultHandler):

public class MyHandler extends DefaultHandler {
    /**
     * Logger for this class
     */
    private static final Log log = LogFactory.getLog(MyHandler.class);
    private StringBuilder sb;

    @Override
    public void startElement(String uri, String localName, String qName,
        Attributes attributes) throws SAXException {
    System.out.println("STARTUri: " + uri);
    System.out.println("STARTLocalName: " + localName);
    System.out.println("STARTqName: " + qName);
//  for(int i=0;i<attributes.getLength();i++) {
//      System.out.println("LocalName: "+attributes.getLocalName(i));
//      System.out.println("Type: "+attributes.getType(i));
//      System.out.println("qName: "+attributes.getQName(i));
//      System.out.println("URI: "+attributes.getURI(i));
//      System.out.println("Value: "+attributes.getValue(i));
//  }
    sb = new StringBuilder();
    //super.startElement(uri, localName, qName, attributes);
    }

    @Override
    public void characters(char[] ch, int start, int length)
            throws SAXException {
    sb.append(ch, start, length);
    System.out.println("TEMPORARY: " + sb.toString());
    System.out.println();
    }

    @Override
    public void endElement(String uri, String localName, String qName)
            throws SAXException {
    System.out.println("ENDUri: " + uri);
    System.out.println("ENDLocalName: " + localName);
    System.out.println("ENDqName: " + qName);
    System.out.println("Content: " + sb.toString());
    sb.replace(0, sb.length()-1,"");
    }

}

输出的解析将类似于:

Is Validating: true
STARTUri: 
STARTLocalName: cop
STARTqName: cop
TEMPORARY: 


STARTUri: 
STARTLocalName: auth
STARTqName: auth
TEMPORARY: 


STARTUri: 
STARTLocalName: uid
STARTqName: uid
TEMPORARY: 16

TEMPORARY: 16
function matchwo(a,b) 

ENDUri: 
ENDLocalName: uid
ENDqName: uid
Content: 16
function matchwo(a,b) 
TEMPORARY:  


ENDUri: 
ENDLocalName: auth
ENDqName: auth
Content:  

TEMPORARY:  


ENDUri: 
ENDLocalName: cop
ENDqName: cop
Content:    

从输出中我们可以看到该方法characters()在节点内被调用了两次,uid因此它可以识别两个孩子。有没有办法知道哪个是 CDATA 哪个是 TEXT?

4

1 回答 1

3

您应该查看告诉您有关 CDATA 开始/结束的LexicalHandler 。

请注意,SAX 解析器可以characters()根据需要随意多次(或尽可能少地)调用您的方法,以便您构建一个字符串(只有在endElement()被调用时才知道它是完整的),而您不能依靠它来确定文档结构。

于 2012-08-01T16:25:07.233 回答