Update of /cvsroot/htmlparser/htmlparser/src/org/htmlparser/lexer
In directory sc8-pr-cvs1.sourceforge.net:/tmp/cvs-serv2443/src/org/htmlparser/lexer
Modified Files:
Tag: v1_41
Page.java
Log Message:
Avoid bugs #995703 (Parser Crash) and #988846 (Linkbean getLinks() segmentation fault)
by no longer rejecting pages whose content type does not start with "text".
Index: Page.java
===================================================================
RCS file: /cvsroot/htmlparser/htmlparser/src/org/htmlparser/lexer/Page.java,v
retrieving revision 1.33
retrieving revision 1.33.2.1
diff -C2 -d -r1.33 -r1.33.2.1
*** Page.java 31 Jan 2004 20:51:01 -0000 1.33
--- Page.java 27 Jul 2004 11:15:23 -0000 1.33.2.1
***************
*** 336,344 ****
}
type = getContentType ();
! if (!type.startsWith ("text"))
! throw new ParserException (
! "URL "
! + connection.getURL ().toExternalForm ()
! + " does not contain text");
charset = getCharset (type);
try
--- 336,345 ----
}
type = getContentType ();
! // removed to avoid bug #995703 Parser Crash and also #988846 Linkbean getLinks() segmentation fault
! // if (!type.startsWith ("text"))
! // throw new ParserException (
! // "URL "
! // + connection.getURL ().toExternalForm ()
! // + " does not contain text");
charset = getCharset (type);
try
|