This is the exception I get when loading the same page with the HtmlUnit 2.10 jars; please note that it works fine with the HtmlUnit 2.9 jars:
[27 Oct 2012 - 16:42:27] DEBUG [com.mypkg.MyClass] - IOException when loading India New Delhi airport arrival page
java.util.zip.ZipException: unknown compression method
at java.util.zip.InflaterInputStream.read(InflaterInputStream.java:147)
at org.cyberneko.html.HTMLScanner$PlaybackInputStream.read(HTMLScanner.java:3511)
at sun.nio.cs.StreamDecoder.readBytes(StreamDecoder.java:264)
at sun.nio.cs.StreamDecoder.implRead(StreamDecoder.java:306)
at sun.nio.cs.StreamDecoder.read(StreamDecoder.java:158)
at java.io.InputStreamReader.read(InputStreamReader.java:167)
at org.cyberneko.html.HTMLScanner$CurrentEntity.load(HTMLScanner.java:1814)
at org.cyberneko.html.HTMLScanner$CurrentEntity.read(HTMLScanner.java:1835)
at org.cyberneko.html.HTMLScanner$ContentScanner.scan(HTMLScanner.java:2000)
at org.cyberneko.html.HTMLScanner.scanDocument(HTMLScanner.java:917)
at org.cyberneko.html.HTMLConfiguration.parse(HTMLConfiguration.java:499)
at org.cyberneko.html.HTMLConfiguration.parse(HTMLConfiguration.java:452)
at org.apache.xerces.parsers.XMLParser.parse(Unknown Source)
at com.gargoylesoftware.htmlunit.html.HTMLParser$HtmlUnitDOMBuilder.parse(HTMLParser.java:798)
at com.gargoylesoftware.htmlunit.html.HTMLParser.parse(HTMLParser.java:234)
at com.gargoylesoftware.htmlunit.html.HTMLParser.parseHtml(HTMLParser.java:180)
at com.gargoylesoftware.htmlunit.DefaultPageCreator.createHtmlPage(DefaultPageCreator.java:267)
at com.gargoylesoftware.htmlunit.DefaultPageCreator.createPage(DefaultPageCreator.java:155)
at com.gargoylesoftware.htmlunit.WebClient.loadWebResponseInto(WebClient.java:440)
at com.gargoylesoftware.htmlunit.WebClient.getPage(WebClient.java:315)
at com.gargoylesoftware.htmlunit.WebClient.getPage(WebClient.java:380)
at com.gargoylesoftware.htmlunit.WebClient.getPage(WebClient.java:365)
at com.mypkg.FSScraper.ScrapeCity(FSScraper.java:40)
at com.mypkg.FSScraper.ScrapeAll(FSScraper.java:121)
at com.mypkg.CronJob$1.run(CronJob.java:52)
at java.util.concurrent.Executors$RunnableAdapter.call(Executors.java:441)
at java.util.concurrent.FutureTask$Sync.innerRunAndReset(FutureTask.java:317)
at java.util.concurrent.FutureTask.runAndReset(FutureTask.java:150)
at java.util.concurrent.ScheduledThreadPoolExecutor$ScheduledFutureTask.access$101(ScheduledThreadPoolExecutor.java:98)
at java.util.concurrent.ScheduledThreadPoolExecutor$ScheduledFutureTask.runPeriodic(ScheduledThreadPoolExecutor.java:181)
at java.util.concurrent.ScheduledThreadPoolExecutor$ScheduledFutureTask.run(ScheduledThreadPoolExecutor.java:205)
at java.util.concurrent.ThreadPoolExecutor$Worker.runTask(ThreadPoolExecutor.java:886)
at java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:908)
at java.lang.Thread.run(Thread.java:619)
If you would like to refer to this comment somewhere else in this project, copy and paste the following link:
I tried again with the latest snapshot, and the page works fine.
So please use the latest snapshot (http://build.canoo.com/htmlunit/artifacts/) and open a new bug if you still have problems.
If you would like to refer to this comment somewhere else in this project, copy and paste the following link:
I don't see any errors; please try with the latest snapshot from http://build.canoo.com/htmlunit/artifacts/
Also, try to isolate a minimal test case.
This is the exception I get when loading the same page with the HtmlUnit 2.10 jars; please note that it works fine with the HtmlUnit 2.9 jars:
[27 Oct 2012 - 16:42:27] DEBUG [com.mypkg.MyClass] - IOException when loading India New Delhi airport arrival page
java.util.zip.ZipException: unknown compression method
at java.util.zip.InflaterInputStream.read(InflaterInputStream.java:147)
at org.cyberneko.html.HTMLScanner$PlaybackInputStream.read(HTMLScanner.java:3511)
at sun.nio.cs.StreamDecoder.readBytes(StreamDecoder.java:264)
at sun.nio.cs.StreamDecoder.implRead(StreamDecoder.java:306)
at sun.nio.cs.StreamDecoder.read(StreamDecoder.java:158)
at java.io.InputStreamReader.read(InputStreamReader.java:167)
at org.cyberneko.html.HTMLScanner$CurrentEntity.load(HTMLScanner.java:1814)
at org.cyberneko.html.HTMLScanner$CurrentEntity.read(HTMLScanner.java:1835)
at org.cyberneko.html.HTMLScanner$ContentScanner.scan(HTMLScanner.java:2000)
at org.cyberneko.html.HTMLScanner.scanDocument(HTMLScanner.java:917)
at org.cyberneko.html.HTMLConfiguration.parse(HTMLConfiguration.java:499)
at org.cyberneko.html.HTMLConfiguration.parse(HTMLConfiguration.java:452)
at org.apache.xerces.parsers.XMLParser.parse(Unknown Source)
at com.gargoylesoftware.htmlunit.html.HTMLParser$HtmlUnitDOMBuilder.parse(HTMLParser.java:798)
at com.gargoylesoftware.htmlunit.html.HTMLParser.parse(HTMLParser.java:234)
at com.gargoylesoftware.htmlunit.html.HTMLParser.parseHtml(HTMLParser.java:180)
at com.gargoylesoftware.htmlunit.DefaultPageCreator.createHtmlPage(DefaultPageCreator.java:267)
at com.gargoylesoftware.htmlunit.DefaultPageCreator.createPage(DefaultPageCreator.java:155)
at com.gargoylesoftware.htmlunit.WebClient.loadWebResponseInto(WebClient.java:440)
at com.gargoylesoftware.htmlunit.WebClient.getPage(WebClient.java:315)
at com.gargoylesoftware.htmlunit.WebClient.getPage(WebClient.java:380)
at com.gargoylesoftware.htmlunit.WebClient.getPage(WebClient.java:365)
at com.mypkg.FSScraper.ScrapeCity(FSScraper.java:40)
at com.mypkg.FSScraper.ScrapeAll(FSScraper.java:121)
at com.mypkg.CronJob$1.run(CronJob.java:52)
at java.util.concurrent.Executors$RunnableAdapter.call(Executors.java:441)
at java.util.concurrent.FutureTask$Sync.innerRunAndReset(FutureTask.java:317)
at java.util.concurrent.FutureTask.runAndReset(FutureTask.java:150)
at java.util.concurrent.ScheduledThreadPoolExecutor$ScheduledFutureTask.access$101(ScheduledThreadPoolExecutor.java:98)
at java.util.concurrent.ScheduledThreadPoolExecutor$ScheduledFutureTask.runPeriodic(ScheduledThreadPoolExecutor.java:181)
at java.util.concurrent.ScheduledThreadPoolExecutor$ScheduledFutureTask.run(ScheduledThreadPoolExecutor.java:205)
at java.util.concurrent.ThreadPoolExecutor$Worker.runTask(ThreadPoolExecutor.java:886)
at java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:908)
at java.lang.Thread.run(Thread.java:619)
Any updates?
I tried again with the latest snapshot, and the page works fine.
So please use the latest snapshot (http://build.canoo.com/htmlunit/artifacts/) and open a new bug if you still have problems.