public class Crawler extends Observable
| Constructor and Description |
|---|
| Crawler(String host, String start, int threads, int max, boolean tidy) |
| Crawler(String host, String username, String password, String start, int threads, int max, boolean tidy) |
| Modifier and Type | Method and Description |
|---|---|
| void | awaitTermination(long timeout, TimeUnit unit) |
| int | getDispatchedCount() |
| DTDMemoryCache | getDtdMemoryCache() |
| List<ICrawlerFilter> | getFilters() |
| String | getHost() |
| SAXParserFactory | getParserFactory() |
| String | getPassword() |
| int | getRetrievedCount() |
| String | getUsername() |
| Map<String,CrawlerResult> | getVisitedURLs() |
| static void | main(String[] args) |
| protected BlockingQueue<Runnable> | newBlockingQueue() |
| protected ICrawlerHistory | newCrawlerHistory() |
| protected CrawlerTask | newCrawlerTask(String url, CrawlerReferrer referrer, boolean tidy) |
| void | queue(String url, CrawlerReferrer referrer) |
| protected void | report(CrawlerResult result) |
| void | shutdown() |
Methods inherited from class Observable: addObserver, clearChanged, countObservers, deleteObserver, deleteObservers, hasChanged, notifyObservers, notifyObservers, setChanged
public static final Object FINISH
protected BlockingQueue<Runnable> newBlockingQueue()
protected ICrawlerHistory newCrawlerHistory()
public void queue(String url, CrawlerReferrer referrer)
protected CrawlerTask newCrawlerTask(String url, CrawlerReferrer referrer, boolean tidy)
protected void report(CrawlerResult result)
public Map<String,CrawlerResult> getVisitedURLs()
public int getDispatchedCount()
public int getRetrievedCount()
public List<ICrawlerFilter> getFilters()
public String getHost()
public SAXParserFactory getParserFactory()
public DTDMemoryCache getDtdMemoryCache()
public String getUsername()
public String getPassword()
public void shutdown()
public void awaitTermination(long timeout, TimeUnit unit) throws InterruptedException
Throws: InterruptedException
public static void main(String[] args) throws InterruptedException
Throws: InterruptedException
Copyright © 2015 Molindo GmbH. All Rights Reserved.