Revision: 2746
http://archive-access.svn.sourceforge.net/archive-access/?rev=2746&view=rev
Author: binzino
Date: 2009-06-25 20:23:20 +0000 (Thu, 25 Jun 2009)
Log Message:
-----------
WAX-49, WAX-50: Added -h and -n command-line options to specify the number of hits per site (-h) and the total number of hits requested (-n).
Modified Paths:
--------------
tags/nutchwax-0_12_5/archive/src/java/org/archive/nutchwax/NutchWaxBean.java
Modified: tags/nutchwax-0_12_5/archive/src/java/org/archive/nutchwax/NutchWaxBean.java
===================================================================
--- tags/nutchwax-0_12_5/archive/src/java/org/archive/nutchwax/NutchWaxBean.java 2009-06-25 20:21:51 UTC (rev 2745)
+++ tags/nutchwax-0_12_5/archive/src/java/org/archive/nutchwax/NutchWaxBean.java 2009-06-25 20:23:20 UTC (rev 2746)
@@ -251,28 +251,59 @@
*/
public static void main(String[] args) throws Exception
{
- String usage = "NutchWaxBean query";
+ String usage = "NutchWaxBean [options] query"
+ + "\n\t-h <n> Hits per site"
+ + "\n\t-n <n> Number of results to find"
+ + "\n";
- if (args.length == 0)
+ if ( args.length == 0 )
{
- System.err.println(usage);
- System.exit(-1);
+ System.err.println( usage );
+ System.exit( -1 );
}
+
+ String queryString = args[args.length - 1];
+ int hitsPerSite = 0;
+ int numHits = 10;
+ for ( int i = 0 ; i < args.length - 1 ; i++ )
+ {
+ try
+ {
+ if ( "-h".equals( args[i] ) )
+ {
+ i++;
+ hitsPerSite = Integer.parseInt( args[i] );
+ }
+ if ( "-n".equals( args[i] ) )
+ {
+ i++;
+ numHits = Integer.parseInt( args[i] );
+ }
+ }
+ catch ( NumberFormatException nfe )
+ {
+ System.err.println( "Error: not a numeric value: " + args[i] );
+ System.err.println( usage );
+ System.exit( -1 );
+ }
+ }
Configuration conf = NutchConfiguration.create();
NutchBean bean = new NutchBean(conf);
NutchBeanModifier.modify( bean );
- Query query = Query.parse(args[0], conf);
- Hits hits = bean.search(query, 10);
- System.out.println("Total hits: " + hits.getTotal());
- int length = (int)Math.min(hits.getTotal(), 10);
+ Query query = Query.parse(queryString, conf);
+ System.out.println("Hits per site: " + hitsPerSite);
+ Hits hits = bean.search(query, numHits, hitsPerSite);
+ System.out.println("Total hits : " + hits.getTotal());
+ System.out.println("Hits length: " + hits.getLength());
+ int length = (int)Math.min(hits.getLength(), numHits);
Hit[] show = hits.getHits(0, length);
HitDetails[] details = bean.getDetails(show);
Summary[] summaries = bean.getSummary(details, query);
- for (int i = 0; i < hits.getLength(); i++)
+ for (int i = 0; i < length; i++)
{
// Use a slightly more verbose output than NutchBean.
System.out.println( " "
This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site.
|