0

我已经看过很多关于这个的帖子,但实际上我没有得到任何工作。我正在构建一个简单的电视指南 android 应用程序。我只是使用来自 tvprofil.net 的 RSS 来显示今天电视上的内容。问题是,我不知道如何在 XML 中解析 CDATA。我正在使用一些带有 DOM 的标准解析器……至少我是这么认为的……

这是一点 XML:

.
.
.
<item>
<title>RTS1 14.08.2012</title>
<pubDate>Tue, 14 Aug 2012 06:00:00</pubDate>
<content:encoded><![CDATA[06:00 Vesti<br>06:05 Jutarnji program<br>08:00 Dnevnik
<br>8:15 Jutarnji Program<br>09:00 Vesti ... ]]></content:encoded>
</item>
.
.
.

现在,这是我的主要应用程序:

public class Main extends ListActivity {

// All static variables
static final String URL = "http://tvprofil.net/rss/feed/channel-group-2.xml";
// XML node keys
static final String KEY_ITEM = "item"; // parent node
static final String KEY_NAME = "title";
static final String KEY_DATE = "pubDate";
static final String KEY_DESC = "content:encoded";

@Override
public void onCreate(Bundle savedInstanceState) {
    super.onCreate(savedInstanceState);
    setContentView(R.layout.activity_main);


    ArrayList<HashMap<String,String>> menuItems = new ArrayList<HashMap<String,String>>();



    XMLParser parser = new XMLParser();
    String xml = parser.getXmlFromUrl(URL); //get XML
    Document doc = parser.getDomElement(xml); // get DOM elem.



    NodeList nl = doc.getElementsByTagName(KEY_ITEM);
    //loop
    for (int i=0; i< nl.getLength(); i++){
        HashMap<String, String> map = new HashMap<String, String>();
        Element e = (Element) nl.item(i);
        //add to map
        map.put(KEY_NAME, parser.getValue(e, KEY_NAME));
        map.put(KEY_DATE, parser.getValue(e, KEY_DATE));
        map.put(KEY_DESC, parser.getValue(e, KEY_DESC));

        // hash => list
        menuItems.add(map);
    }

    ListAdapter adapter = new SimpleAdapter(this, menuItems, R.layout.list_item,
            new String[]{KEY_NAME, KEY_DESC, KEY_DATE}, new int[]{
            R.id.name, R.id.description, R.id.date
    });
    setListAdapter(adapter);

    //singleView
    ListView lv = getListView();

    lv.setOnItemClickListener(new OnItemClickListener(){
        @Override
        public void onItemClick(AdapterView<?> parent, View view, int position, long id){
            String name = ((TextView)view.findViewById(R.id.name)).getText().toString();
            String date = ((TextView)view.findViewById(R.id.date)).getText().toString();
            String description = ((TextView)view.findViewById(R.id.description)).getText().toString();

            //intent
            Intent in = new Intent(getApplicationContext(), SingleMenuItemActivity.class);
            in.putExtra(KEY_NAME, name);
            in.putExtra(KEY_DATE, date);
            in.putExtra(KEY_DESC, description);
            startActivity(in);
        }
    });

}

}

和解析器类:

public class XMLParser {

// constructor
public XMLParser() {

}

/**
 * Getting XML from URL making HTTP request
 * @param url string
 * */
public String getXmlFromUrl(String url) {
    String xml = null;


    try {
        // defaultHttpClient
        DefaultHttpClient httpClient = new DefaultHttpClient();
        HttpPost httpPost = new HttpPost(url);

        HttpResponse httpResponse = httpClient.execute(httpPost);
        HttpEntity httpEntity = httpResponse.getEntity();
        xml = EntityUtils.toString(httpEntity);

    } catch (UnsupportedEncodingException e) {
        e.printStackTrace();
    } catch (ClientProtocolException e) {
        e.printStackTrace();
    } catch (IOException e) {
        e.printStackTrace();
    }
    // return XML
    return xml;
}

/**
 * Getting XML DOM element
 * @param XML string
 * */

public Document getDomElement(String xml){

    Document doc = null;
    DocumentBuilderFactory dbf = DocumentBuilderFactory.newInstance();
    try {

        DocumentBuilder db = dbf.newDocumentBuilder();

        InputSource is = new InputSource();
            is.setCharacterStream(new StringReader(xml));
            doc = db.parse(is); 

        } catch (ParserConfigurationException e) {
            Log.e("Error: ", e.getMessage());
            return null;
        } catch (SAXException e) {
            Log.e("Error: ", e.getMessage());
            return null;
        } catch (IOException e) {
            Log.e("Error: ", e.getMessage());
            return null;
        }

        return doc;
}

/** Getting node value
  * @param elem element
  */
 public final String getElementValue( Node elem ) {

     Node child;
     if( elem != null){
         if (elem.hasChildNodes()){
             for( child = elem.getFirstChild(); child != null; child = child.getNextSibling() ){
                 if( child.getNodeType() == Node.TEXT_NODE  ){
                     return child.getNodeValue();
                 }
             }
         }
     }
     return "";
 }

 /**
  * Getting node value
  * @param Element node
  * @param key string
  * */
 public String getValue(Element item, String str) {     
        NodeList n = item.getElementsByTagName(str);        
        return this.getElementValue(n.item(0));
    }
}

Single menu item 还有一个类..但我认为在这种情况下它是无关紧要的。现在,我只想在解析它并处理 CDATA 之后看不到 HTML 标签……有人知道这个吗?

4

4 回答 4

2

添加这个

 dbf.setCoalescing(true); 

dbf 在哪里

DocumentBuilderFactory dbf = DocumentBuilderFactory.newInstance();
于 2012-08-14T10:53:21.170 回答
1
  1. 先添加这个方法

    public String getCharacterDataFromElement(Element e, String str) {
    NodeList n = e.getElementsByTagName(str);   
    Element e1=(Element) n.item(0);
    
    Node child = e1.getFirstChild();
    if (child instanceof CharacterData) {
      CharacterData cd = (CharacterData) child;
      return cd.getData();
    }
    return "";
    }
    
  2. 像这样调用上述方法-

    map.put(KEY_DESC, parser.getCharacterDataFromElement(e, KEY_DESC));
    

这应该为您提供字符串格式的 CDATA。希望这可以帮助

于 2013-10-11T13:22:39.690 回答
0

当我需要从一组“描述”xml 元素中的 CDATA 中提取图像 URL 时,zg_spring 的答案对我来说非常有效:

//Get the content of all "item" elements    
DocumentBuilder db = DocumentBuilderFactory.newInstance().newDocumentBuilder();
Document doc = db.parse(new InputSource(new StringReader(xml)));
NodeList nlDetails = doc.getElementsByTagName("item");    

//Loop through elements and extract content of "description" elements    
for(int k = 0; k < numDetails; k++) {
    Element nDetails = (Element)nlDetails.item(k);
    NodeList nlCoverURL = nDetails.getElementsByTagName("description");         
    Node nCoverURL = nlCoverURL.item(0);
    String sCoverURL = nCoverURL.getTextContent();

    //Isolate the relevant part of the String and load it into an ArrayList
    String[] descriptionContent = sCoverURL.split("\"");
    String s = descriptionContent[11]
    alImages.add(s);
} 
于 2013-04-24T02:37:49.750 回答
0

获取文本内容。此属性返回此节点及其后代的文本内容

getNodeValue() 这个节点的值,取决于它的类型;

通常你应该使用 getTextContent。

于 2012-12-11T02:35:02.423 回答