Revision: 3387
          http://archive-access.svn.sourceforge.net/archive-access/?rev=3387&view=rev
Author:   bradtofel
Date:     2011-02-06 14:31:04 +0000 (Sun, 06 Feb 2011)
Log Message:
-----------
added tests for real-world examples
Modified Paths:
--------------
    trunk/archive-access/projects/wayback/wayback-core/src/test/java/org/archive/wayback/accesscontrol/staticmap/StaticMapExclusionFilterTest.java
Modified: trunk/archive-access/projects/wayback/wayback-core/src/test/java/org/archive/wayback/accesscontrol/staticmap/StaticMapExclusionFilterTest.java
===================================================================
--- trunk/archive-access/projects/wayback/wayback-core/src/test/java/org/archive/wayback/accesscontrol/staticmap/StaticMapExclusionFilterTest.java	2011-01-19 03:28:43 UTC (rev 3386)
+++ trunk/archive-access/projects/wayback/wayback-core/src/test/java/org/archive/wayback/accesscontrol/staticmap/StaticMapExclusionFilterTest.java	2011-02-06 14:31:04 UTC (rev 3387)
@@ -24,8 +24,10 @@
 import java.io.IOException;
 import java.util.Map;
 
+import org.archive.wayback.UrlCanonicalizer;
 import org.archive.wayback.core.CaptureSearchResult;
 import org.archive.wayback.util.ObjectFilter;
+import org.archive.wayback.util.url.AggressiveUrlCanonicalizer;
 
 import junit.framework.TestCase;
 
@@ -39,6 +41,7 @@
 
 	File tmpFile = null;
 	StaticMapExclusionFilterFactory factory = null;
+	UrlCanonicalizer canonicalizer = new AggressiveUrlCanonicalizer();
 
 	protected void setUp() throws Exception {
 		super.setUp();
@@ -62,6 +65,71 @@
 	/**
 	 * @throws Exception
 	 */
+	public void testRealWorld() throws Exception {
+		String bases[] = { "pho-c.co.jp/~clever",
+							"sf.net/pop/Roger",
+							"www.eva-stu.vn",
+							"mins.com.br/",
+							"24.ne.jp",
+							"24.ne.jp/~nekko"};
+//		setTmpContents(bases);
+		
+		
+		ObjectFilter<CaptureSearchResult> filter = getFilter(bases);
+		assertFalse("unmassaged",isBlocked(filter,"24.ne.jp.idpnt.com/robots.txt"));
+		assertTrue("massage",isBlocked(filter,"http://24.ne.jp:80/"));
+		assertTrue("unmassaged",isBlocked(filter,"http://www.pho-c.co.jp/~clever"));
+		assertTrue("massage",isBlocked(filter,"http://24.ne.jp"));
+
+		
+		assertTrue("unmassaged",isBlocked(filter,"http://www.pho-c.co.jp/~clever"));
+		assertTrue("massaged",isBlocked(filter,"http://pho-c.co.jp/~clever"));
+		assertTrue("trailing-slash",isBlocked(filter,"http://pho-c.co.jp/~clever/"));
+		assertTrue("subpath",isBlocked(filter,"http://pho-c.co.jp/~clever/foo.txt"));
+
+		assertTrue("full-port",isBlocked(filter,"http://www.mins.com.br:80"));
+		assertTrue("tail-slash-port",isBlocked(filter,"http://www.mins.com.br:80/"));
+		assertTrue("full",isBlocked(filter,"http://www.mins.com.br"));
+		assertTrue("tail-slash",isBlocked(filter,"http://www.mins.com.br/"));
+		assertTrue("full-massage",isBlocked(filter,"http://mins.com.br"));
+		assertTrue("tail-slash-massage",isBlocked(filter,"http://mins.com.br/"));
+		assertTrue("massage",isBlocked(filter,"http://mins.com.br/foo.txt"));
+		assertTrue("subpath",isBlocked(filter,"http://www13.mins.com.br/~clever/foo.txt"));
+
+		assertTrue("massage",isBlocked(filter,"24.ne.jp"));
+		assertTrue("full",isBlocked(filter,"http://www.mins.com.br"));
+		assertTrue("subpath",isBlocked(filter,"www.24.ne.jp"));
+		assertTrue("tail-slash-massage",isBlocked(filter,"http://mins.com.br/"));
+		assertTrue("subpath",isBlocked(filter,"http://www.24.ne.jp:80/"));
+		
+
+		
+		
+		assertTrue(isBlocked(filter,"http://sf.net/pop/Roger"));
+		assertTrue(isBlocked(filter,"http://sf.net/pop/Roger/"));
+		assertTrue(isBlocked(filter,"http://sf.net/pop/Roger//"));
+		assertFalse(isBlocked(filter,"http://sf.net/pop/"));
+		assertTrue(isBlocked(filter,"http://sf.net/pop/Roger/2"));
+		assertTrue(isBlocked(filter,"http://sf.net/pop/Roger/23"));
+		assertTrue(isBlocked(filter,"http://www.sf.net/pop/Roger"));
+		assertTrue(isBlocked(filter,"http://www1.sf.net/pop/Roger"));
+		assertTrue(isBlocked(filter,"http://www23.sf.net/pop/Roger"));
+
+		assertTrue(isBlocked(filter,"http://www23.eva-stu.vn/"));
+		assertTrue(isBlocked(filter,"http://www23.eva-stu.vn"));
+		assertTrue(isBlocked(filter,"http://eva-stu.vn"));
+		assertTrue(isBlocked(filter,"http://www.eva-stu.vn/"));
+		assertTrue(isBlocked(filter,"http://eva-stu.vn/"));
+		assertTrue(isBlocked(filter,"http://www.eva-stu.vn/foo.txt"));
+		assertTrue(isBlocked(filter,"http://www2.eva-stu.vn/foo/bar.txt"));
+		assertTrue(isBlocked(filter,"http://eva-stu.vn/foo/bar.txt"));
+
+	}
+
+	
+	/**
+	 * @throws Exception
+	 */
 	public void testBaseNoPrefix() throws Exception {
 		String bases[] = {"http://www.peagreenboat.com/",
 							"http://peagreenboat.com/"};
@@ -93,7 +161,7 @@
 		
 		setTmpContents(lines);
 		Map<String,Object> map = factory.loadFile(tmpFile.getAbsolutePath());
-		return new StaticMapExclusionFilter(map);
+		return new StaticMapExclusionFilter(map,canonicalizer);
 	}
 	
 	private void setTmpContents(String[] lines) throws IOException {
This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site.
 |