public class WarcIndexer extends Object
Constructor and Description |
---|
WarcIndexer() |
Modifier and Type | Method and Description |
---|---|
UrlCanonicalizer | getCanonicalizer() |
boolean | isProcessAll() |
org.archive.util.iterator.CloseableIterator<CaptureSearchResult> | iterator(File warc) |
org.archive.util.iterator.CloseableIterator<CaptureSearchResult> | iterator(String pathOrUrl) |
org.archive.util.iterator.CloseableIterator<CaptureSearchResult> | iterator(org.archive.io.warc.WARCReader reader) |
void | setCanonicalizer(UrlCanonicalizer canonicalizer) |
void | setProcessAll(boolean processAll) |
public boolean isProcessAll()
public void setProcessAll(boolean processAll)
public org.archive.util.iterator.CloseableIterator<CaptureSearchResult> iterator(File warc) throws IOException
Parameters: warc
Throws: IOException
public org.archive.util.iterator.CloseableIterator<CaptureSearchResult> iterator(String pathOrUrl) throws IOException
Parameters: pathOrUrl
Throws: IOException
public org.archive.util.iterator.CloseableIterator<CaptureSearchResult> iterator(org.archive.io.warc.WARCReader reader) throws IOException
Parameters: reader - The reader for the WARC file to search.
Throws: IOException
public UrlCanonicalizer getCanonicalizer()
public void setCanonicalizer(UrlCanonicalizer canonicalizer)
Copyright © 2005–2015 IIPC. All rights reserved.