public class DemoDepthCrawler extends BreadthCrawler
autoParse, LOG, parseImg, regexRule, requester, visitor

dbManager, executeInterval, executor, fetcher, forcedSeeds, maxExecuteCount, nextFilter, resumable, RUNNING, seeds, status, STOPED, threads, topN

| 构造器和说明 |
|---|
| DemoDepthCrawler(String crawlPath, boolean autoParse) |

| 限定符和类型 | 方法和说明 |
|---|---|
| protected void | afterParse(Page page, CrawlDatums next) |
| static void | main(String[] args) |
| void | visit(Page page, CrawlDatums next) |

addRegex, execute, getRegexRule, getRequester, getResponse, getVisitor, isAutoParse, isParseImg, parseLink, setAutoParse, setParseImg, setRegexRule, setRequester, setVisitor

addSeed, addSeed, addSeed, addSeed, addSeed, addSeed, addSeed, addSeed, addSeed, addSeed, addSeed, addSeed, getDBManager, getExecuteInterval, getExecutor, getMaxExecuteCount, getNextFilter, getThreads, getTopN, inject, injectForcedSeeds, isResumable, setDBManager, setExecuteInterval, setExecutor, setMaxExecuteCount, setNextFilter, setResumable, setThreads, setTopN, start, stop, toString

public DemoDepthCrawler(String crawlPath, boolean autoParse)
public void visit(Page page, CrawlDatums next)
protected void afterParse(Page page, CrawlDatums next)
afterParse 在类中 AutoParseCrawler

Copyright © 2017. All Rights Reserved.