public class DemoBingCrawler extends RamCrawler
autoParse, LOG, parseImg, regexRule, requester, visitor
dbManager, executeInterval, executor, fetcher, forcedSeeds, maxExecuteCount, nextFilter, resumable, RUNNING, seeds, status, STOPED, threads, topN

| 构造器和说明 |
|---|
| DemoBingCrawler(String keyword, int maxPageNum) |
| 限定符和类型 | 方法和说明 |
|---|---|
| static String | createBingUrl(String keyword, int pageNum)<br>根据关键词和页号拼接Bing搜索对应的URL |
| static void | main(String[] args) |
| void | visit(Page page, CrawlDatums next) |

start
addRegex, afterParse, execute, getRegexRule, getRequester, getResponse, getVisitor, isAutoParse, isParseImg, parseLink, setAutoParse, setParseImg, setRegexRule, setRequester, setVisitor
addSeed, addSeed, addSeed, addSeed, addSeed, addSeed, addSeed, addSeed, addSeed, addSeed, addSeed, addSeed, getDBManager, getExecuteInterval, getExecutor, getMaxExecuteCount, getNextFilter, getThreads, getTopN, inject, injectForcedSeeds, isResumable, setDBManager, setExecuteInterval, setExecutor, setMaxExecuteCount, setNextFilter, setResumable, setThreads, setTopN, start, stop, toString

public void visit(Page page, CrawlDatums next)
Copyright © 2017. All Rights Reserved.