在java中使用SAX解析XML

发布于 2024-12-11 15:14:42 字数 6679 浏览 0 评论 0原文

我有这段代码来解析 XML 数据。

但是,当调用 startelement 和 endelement 函数时,它们在绑定打印参数值时不会获取参数值(因为 name 参数没有任何数据)。它没有任何价值,为什么?

我在下面的代码中调用 updateArticle 函数

import java.io.IOException;
import java.net.MalformedURLException;
import java.net.URL;
import java.util.ArrayList;

import javax.xml.parsers.ParserConfigurationException;
import javax.xml.parsers.SAXParser;
import javax.xml.parsers.SAXParserFactory;

import org.xml.sax.Attributes;
import org.xml.sax.InputSource;
import org.xml.sax.SAXException;
import org.xml.sax.XMLReader;
import org.xml.sax.helpers.DefaultHandler;


    public class RSSHandler extends DefaultHandler {

            // Used to define what elements we are currently in
            private boolean inItem = false;
            private boolean inTitle = false;
            private boolean inLink = false;

            // Feed and Article objects to use for temporary storage
            private Article currentArticle = new Article();
            private Feed currentFeed = new Feed();

            // Number of articles added so far
            private int articlesAdded = 0;

            private ArrayList<Article> articles = new ArrayList<Article>(); 
            private ArrayList<Feed> feeds = new ArrayList<Feed>(); 
            // Number of articles to download
            private static final int ARTICLES_LIMIT = 15;

            // The possible values for targetFlag
            private static final int TARGET_FEED = 0;
            private static final int TARGET_ARTICLES = 1;

            // A flag to know if looking for Articles or Feed name
            private int targetFlag;


            public RSSHandler(){ }
            public void startElement(String uri, String name, String qName,Attributes atts) {
                    if (name.trim().equals("title"))
                            inTitle = true;
                    else if (name.trim().equals("item"))
                            inItem = true;
                    else if (name.trim().equals("link"))
                            inLink = true;
                    System.out.println(name.trim());
            }

            public void endElement(String uri, String name, String qName)throws SAXException {
                    if (name.trim().equals("title"))
                            inTitle = false;
                    else if (name.trim().equals("item"))
                            inItem = false;
                    else if (name.trim().equals("link"))
                            inLink = false;

                    // Check if looking for feed, and if feed is complete
                    if (targetFlag == TARGET_FEED && currentFeed.url != null && currentFeed.title != null) {
                            // We know everything we need to know, so insert feed and exit
                            System.out.println("add current feed");
                            feeds.add(currentFeed);
                         //   throw new SAXException();
                    }

                    // Check if looking for article, and if article is complete
                    if (targetFlag == TARGET_ARTICLES && currentArticle.url != null && currentArticle.title != null) {

                            Article article = new Article();
                            article.feedId = currentFeed.id;
                            article.title = currentArticle.title;
                            article.url = currentArticle.url;
                            System.out.print(article.title);
                            articles.add(article);

                            //store articles in database

                            currentArticle.title = null;
                            currentArticle.url = null;

                            // Lets check if we've hit our limit on number of articles
                            articlesAdded++;
                            if (articlesAdded >= ARTICLES_LIMIT)
                                    throw new SAXException();
                    }

            }
            public ArrayList<Article> getArticles(){
                return this.articles;
            }            
            public ArrayList<Feed> getFeeds(){
                return this.feeds;
            }
            public void characters(char ch[], int start, int length) {

                    String chars = (new String(ch).substring(start, start + length));
                    System.out.println(chars);
                    try {
                            // If not in item, then title/link refers to feed
                            if (!inItem) {
                                    if (inTitle)
                                            currentFeed.title = chars;

                            } else {

                                    if (inLink)
                                            currentArticle.url = new URL(chars);
                                    if (inTitle)
                                            currentArticle.title = chars;

                            }
                    } catch (MalformedURLException e) {
                    }

            }

            public void createFeed(URL url) {
                    try {
                            targetFlag = TARGET_FEED;
                            currentFeed.url = url;

                            SAXParserFactory spf = SAXParserFactory.newInstance();
                            SAXParser sp = spf.newSAXParser();
                            XMLReader xr = sp.getXMLReader();
                            xr.setContentHandler(this);
                            xr.parse(new InputSource(url.openStream()));

                    } catch (IOException e) {}
                    catch (SAXException e) {} 
                    catch (ParserConfigurationException e) {}
            }

            public void updateArticles(Feed feed) {
                    try {
                            targetFlag = TARGET_ARTICLES;
                            currentFeed = feed;
                            System.out.println(feed.url.toString());
                            SAXParserFactory spf = SAXParserFactory.newInstance();
                            SAXParser sp = spf.newSAXParser();
                            XMLReader xr = sp.getXMLReader();
                            xr.setContentHandler(this);
                            xr.parse(new InputSource(currentFeed.url.openStream()));

                    } catch (IOException e) {} 
                    catch (SAXException e) {} 
                    catch (ParserConfigurationException e) {}
            }

    }

I have this code to parse XML data ..

But when startelement and endelement functions are called they don't get the parameters values ( as name parameter don't have any data ) when tying to print the parameters values. it dont't have any value, why ?

I call updateArticle function in the following code

import java.io.IOException;
import java.net.MalformedURLException;
import java.net.URL;
import java.util.ArrayList;

import javax.xml.parsers.ParserConfigurationException;
import javax.xml.parsers.SAXParser;
import javax.xml.parsers.SAXParserFactory;

import org.xml.sax.Attributes;
import org.xml.sax.InputSource;
import org.xml.sax.SAXException;
import org.xml.sax.XMLReader;
import org.xml.sax.helpers.DefaultHandler;


    public class RSSHandler extends DefaultHandler {

            // Used to define what elements we are currently in
            private boolean inItem = false;
            private boolean inTitle = false;
            private boolean inLink = false;

            // Feed and Article objects to use for temporary storage
            private Article currentArticle = new Article();
            private Feed currentFeed = new Feed();

            // Number of articles added so far
            private int articlesAdded = 0;

            private ArrayList<Article> articles = new ArrayList<Article>(); 
            private ArrayList<Feed> feeds = new ArrayList<Feed>(); 
            // Number of articles to download
            private static final int ARTICLES_LIMIT = 15;

            // The possible values for targetFlag
            private static final int TARGET_FEED = 0;
            private static final int TARGET_ARTICLES = 1;

            // A flag to know if looking for Articles or Feed name
            private int targetFlag;


            public RSSHandler(){ }
            public void startElement(String uri, String name, String qName,Attributes atts) {
                    if (name.trim().equals("title"))
                            inTitle = true;
                    else if (name.trim().equals("item"))
                            inItem = true;
                    else if (name.trim().equals("link"))
                            inLink = true;
                    System.out.println(name.trim());
            }

            public void endElement(String uri, String name, String qName)throws SAXException {
                    if (name.trim().equals("title"))
                            inTitle = false;
                    else if (name.trim().equals("item"))
                            inItem = false;
                    else if (name.trim().equals("link"))
                            inLink = false;

                    // Check if looking for feed, and if feed is complete
                    if (targetFlag == TARGET_FEED && currentFeed.url != null && currentFeed.title != null) {
                            // We know everything we need to know, so insert feed and exit
                            System.out.println("add current feed");
                            feeds.add(currentFeed);
                         //   throw new SAXException();
                    }

                    // Check if looking for article, and if article is complete
                    if (targetFlag == TARGET_ARTICLES && currentArticle.url != null && currentArticle.title != null) {

                            Article article = new Article();
                            article.feedId = currentFeed.id;
                            article.title = currentArticle.title;
                            article.url = currentArticle.url;
                            System.out.print(article.title);
                            articles.add(article);

                            //store articles in database

                            currentArticle.title = null;
                            currentArticle.url = null;

                            // Lets check if we've hit our limit on number of articles
                            articlesAdded++;
                            if (articlesAdded >= ARTICLES_LIMIT)
                                    throw new SAXException();
                    }

            }
            public ArrayList<Article> getArticles(){
                return this.articles;
            }            
            public ArrayList<Feed> getFeeds(){
                return this.feeds;
            }
            public void characters(char ch[], int start, int length) {

                    String chars = (new String(ch).substring(start, start + length));
                    System.out.println(chars);
                    try {
                            // If not in item, then title/link refers to feed
                            if (!inItem) {
                                    if (inTitle)
                                            currentFeed.title = chars;

                            } else {

                                    if (inLink)
                                            currentArticle.url = new URL(chars);
                                    if (inTitle)
                                            currentArticle.title = chars;

                            }
                    } catch (MalformedURLException e) {
                    }

            }

            public void createFeed(URL url) {
                    try {
                            targetFlag = TARGET_FEED;
                            currentFeed.url = url;

                            SAXParserFactory spf = SAXParserFactory.newInstance();
                            SAXParser sp = spf.newSAXParser();
                            XMLReader xr = sp.getXMLReader();
                            xr.setContentHandler(this);
                            xr.parse(new InputSource(url.openStream()));

                    } catch (IOException e) {}
                    catch (SAXException e) {} 
                    catch (ParserConfigurationException e) {}
            }

            public void updateArticles(Feed feed) {
                    try {
                            targetFlag = TARGET_ARTICLES;
                            currentFeed = feed;
                            System.out.println(feed.url.toString());
                            SAXParserFactory spf = SAXParserFactory.newInstance();
                            SAXParser sp = spf.newSAXParser();
                            XMLReader xr = sp.getXMLReader();
                            xr.setContentHandler(this);
                            xr.parse(new InputSource(currentFeed.url.openStream()));

                    } catch (IOException e) {} 
                    catch (SAXException e) {} 
                    catch (ParserConfigurationException e) {}
            }

    }

如果你对这篇内容有疑问,欢迎到本站社区发帖提问 参与讨论,获取更多帮助,或者扫码二维码加入 Web 技术交流群。

扫码二维码加入Web技术交流群

发布评论

需要 登录 才能够评论, 你可以免费 注册 一个本站的账号。

评论(2

不必在意 2024-12-18 15:14:42

JAXP 中最令人震惊的设计决策之一(有很多)是 SAXParserFactory 默认情况下创建一个不支持名称空间的解析器。始终在返回的解析器上调用 setNamespaceAware(true)。否则,XMLReader 将使用为非命名空间感知解析器定义的选项来调用 startElement,这意味着它将提供词法 QName,但不提供本地名称和 URI。

One of the most appalling design decisions in JAXP (and there were many) was that SAXParserFactory by default creates a parser that is not namespace-aware. Always call setNamespaceAware(true) on the returned parser. Otherwise, the XMLReader will call startElement using the options defined for a non-namespace-aware parser, which means it will supply the lexical QName, but not the local-name and URI.

谎言 2024-12-18 15:14:42

qName 参数包含元素名称。

这是一个示例尽管由于格式的原因很难阅读。

命名空间等对获取元素名称的位置/方式产生影响。

The qName parameter contains the element name.

Here's an example although it's hard to read because of formatting.

Namespacing etc. makes a difference in where/how to get at element names.

~没有更多了~
我们使用 Cookies 和其他技术来定制您的体验包括您的登录状态等。通过阅读我们的 隐私政策 了解更多相关信息。 单击 接受 或继续使用网站,即表示您同意使用 Cookies 和您的相关数据。
原文