Menu

Why can't I parse this page? Thanks a lot

Help
SpencerWHJ
2004-10-11
2013-04-27
  • SpencerWHJ

    SpencerWHJ - 2004-10-11

    The code is listed below:

    import java.util.ArrayList;
    import java.util.List;

    import org.htmlparser.Node;
    import org.htmlparser.NodeFilter;
    import org.htmlparser.Parser;
    import org.htmlparser.filters.NodeClassFilter;
    import org.htmlparser.parserapplications.StringExtractor;
    import org.htmlparser.tags.FrameTag;
    import org.htmlparser.util.ParserException;

    /*
    * This is a bean that holds information about a web page
    */
    public class TimeReader {

       private String URL;

       public TimeReader(String URL) {
          setURL(URL);
       }

       public void setURL(String URL) {
          this.URL = URL;
       }

       public static void main(String[] args){
     
        TimeReader tr = new TimeReader("http://www.time.com/time/election2004/article/0,18471,709071,00.html");
        tr.process();
     
      }
       /*
        * Use the HTMLParser to parse a HTML Page
        */
       public void process() {
          StringExtractor se = new StringExtractor (URL);
          String contents = null;
          try {
             contents = se.extractStrings(true);
             System.out.println(contents);
          } catch (ParserException e) {
             e.printStackTrace();
             return;
          }

          }
       }
    }

    The error output:

    Exception in thread "main" java.lang.NullPointerException
            at org.htmlparser.beans.StringBean.visitTag(StringBean.java:645)
            at org.htmlparser.nodes.TagNode.accept(TagNode.java:775)
            at org.htmlparser.tags.CompositeTag.accept(CompositeTag.java:439)
            at org.htmlparser.tags.CompositeTag.accept(CompositeTag.java:435)
            at org.htmlparser.tags.CompositeTag.accept(CompositeTag.java:435)
            at org.htmlparser.Parser.visitAllNodesWith(Parser.java:752)
            at org.htmlparser.beans.StringBean.setStrings(StringBean.java:318)
            at org.htmlparser.beans.StringBean.setURL(StringBean.java:484)
            at org.htmlparser.parserapplications.StringExtractor.extractStrings(StringExtractor.java:64)

     

Log in to post a comment.

Want the latest updates on software, tech news, and AI?
Get latest updates about software, tech news, and AI from SourceForge directly in your inbox once a month.