1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23 package org.archive.access.nutch;
24
25 import java.io.IOException;
26
27 import org.apache.hadoop.io.Text;
28
29 import junit.framework.TestCase;
30
31 /***
32 * @author stack
33 * @version $Date: 2006-12-15 00:49:38 +0000 (Fri, 15 Dec 2006) $ $Version$
34 */
35 public class NutchwaxTest extends TestCase {
36 public void testGetCollectionFromWaxKey() throws IOException {
37 String key = " c=nla2005,u=http://www.funkmymobile.com.au/en/" +
38 "download.php?f=c_14&a=khamega&type=14&id=5247&son_nom=" +
39 "??%20Janta%20??%20Ja&son_wav=jantaja.mp3&lang=EN&c=GB\n";
40 String collection = "nla2005";
41 assertEquals(Nutchwax.getCollectionFromWaxKey(new Text(key)),
42 collection);
43 key = "c=nla2005,u=http://www.mobilewallpapers.com.au/en/download." +
44 "php?f=c_14&a=mowall&type=14&id=5247&son_nom=??%20Janta%20??%20" +
45 "Ja&son_wav=jantaja.mp3&lang=EN&c=GB";
46 assertEquals(Nutchwax.getCollectionFromWaxKey(new Text(key)),
47 collection);
48 key = "c=5b5c430260d421a0ac8fdd461142e867,u=http://history." +
49 "sacentral.sa.gov.au/site/page.cfm?u=47&listMode=" +
50 "listLinks&path=\n 4873,4884,4894";
51 collection = "5b5c430260d421a0ac8fdd461142e867";
52 assertEquals(Nutchwax.getCollectionFromWaxKey(new Text(key)),
53 collection);
54 String url = "http://history." +
55 "sacentral.sa.gov.au/site/page.cfm?u=47&listMode=" +
56 "listLinks&path=\n 4873,4884,4894";
57 assertEquals(Nutchwax.getUrlFromWaxKey(new Text(key)),
58 url);
59 }
60 }