org.archive.wayback.resourcestore.indexer
Class WarcIndexer

java.lang.Object
  extended by org.archive.wayback.resourcestore.indexer.WarcIndexer

public class WarcIndexer
extends Object


Constructor Summary
WarcIndexer()
           
 
Method Summary
 UrlCanonicalizer getCanonicalizer()
           
 boolean isProcessAll()
           
 CloseableIterator<CaptureSearchResult> iterator(File warc)
           
 CloseableIterator<CaptureSearchResult> iterator(String pathOrUrl)
           
 CloseableIterator<CaptureSearchResult> iterator(org.archive.io.warc.WARCReader reader)
           
 void setCanonicalizer(UrlCanonicalizer canonicalizer)
           
 void setProcessAll(boolean processAll)
           
 
Methods inherited from class java.lang.Object
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
 

Constructor Detail

WarcIndexer

public WarcIndexer()
Method Detail

isProcessAll

public boolean isProcessAll()

setProcessAll

public void setProcessAll(boolean processAll)

iterator

public CloseableIterator<CaptureSearchResult> iterator(File warc)
                                                throws IOException
Parameters:
warc - the WARC File to index
Returns:
Iterator of CaptureSearchResults for the input WARC File
Throws:
IOException

iterator

public CloseableIterator<CaptureSearchResult> iterator(String pathOrUrl)
                                                throws IOException
Parameters:
pathOrUrl - path or URL of the WARC file to index
Returns:
Iterator of CaptureSearchResults for the input pathOrUrl
Throws:
IOException

iterator

public CloseableIterator<CaptureSearchResult> iterator(org.archive.io.warc.WARCReader reader)
                                                throws IOException
Parameters:
reader - the WARCReader to index
Returns:
Iterator of CaptureSearchResults for the input WARCReader
Throws:
IOException

getCanonicalizer

public UrlCanonicalizer getCanonicalizer()

setCanonicalizer

public void setCanonicalizer(UrlCanonicalizer canonicalizer)


Copyright © 2005-2011 Internet Archive. All Rights Reserved.