public final class UrlQueue extends Object
| 构造器和说明 |
|---|
UrlQueue() |
| 限定符和类型 | 方法和说明 |
|---|---|
static void |
addUnVisitedLinks(String seedName,
HashSet<String> links)
追加未访问的links队列
首先判断新抓取的link是否在已访问的队列中，然后判断是否在未抓取的队列中；如果都不在，则将其加进未访问的队列中 |
static void |
clearFailVisitedUrl(String seedName)
清空已访问失败url队列
|
static void |
clearVisitedLink(String seedName)
清空已访问link队列
|
static void |
clearVisitedResource(String seedName)
清空已访问resource队列
|
static Collection<String> |
getFailVisitedUrl(String seedName)
获取已访问失败的url队列
|
static long |
getFailVisitedUrlCount(String seedName) |
static String |
getFirst(String seedName)
获取头元素
|
static Queue<String> |
getUnVisitedLink(String seedName)
获取未访问link队列
|
static Queue<String> |
getUnVisitedResource(String seedName)
获取未访问resource队列
|
static long |
getUnVisitedUrlCount(String seedName) |
static Queue<String> |
getVisitedLink(String seedName)
获取已访问link队列
|
static Queue<String> |
getVisitedResource(String seedName)
获取已访问resource队列
|
static long |
getVisitedUrlCount(String seedName) |
static boolean |
isEmptyUnVisitedLinks(String seedName)
判断未访问链接是否为空
|
static void |
newFailVisitedUrl(String seedName,
String failurl)
增加已访问失败的url(包括link、资源文件)
|
static void |
newUnVisitedLink(String seedName,
String link)
新增未访问的link到队列中
|
static void |
newUnVisitedResource(String seedName,
String resourceLink)
新增未访问的resource到队列中
|
static void |
newVisitedLink(String seedName,
String link)
新增已访问的link到队列中
|
static void |
newVisitedResource(String seedName,
String resource)
新增已访问的resource到队列中
|
static String |
outFirst(String seedName)
删除头元素
|
static void |
registerRedisQueue(Queue<String> redisQueue) |
public static long getVisitedUrlCount(String seedName)
public static long getUnVisitedUrlCount(String seedName)
public static long getFailVisitedUrlCount(String seedName)
public static void addUnVisitedLinks(String seedName, HashSet<String> links)
seedName - String
links - HashSet
public static void newUnVisitedLink(String seedName, String link)
seedName - String
link - String
public static boolean isEmptyUnVisitedLinks(String seedName)
seedName - String
public static void newUnVisitedResource(String seedName, String resourceLink)
seedName - String
resourceLink - String
public static void newVisitedLink(String seedName, String link)
seedName - String
link - String
public static void newVisitedResource(String seedName, String resource)
seedName - String
resource - String
public static void newFailVisitedUrl(String seedName, String failurl)
seedName - String
failurl - String
public static Queue<String> getUnVisitedLink(String seedName)
seedName - String
public static Queue<String> getUnVisitedResource(String seedName)
seedName - String
public static Queue<String> getVisitedLink(String seedName)
seedName - String
public static void clearVisitedLink(String seedName)
seedName - String
public static void clearFailVisitedUrl(String seedName)
seedName - String
public static Queue<String> getVisitedResource(String seedName)
seedName - String
public static void clearVisitedResource(String seedName)
seedName - String
public static Collection<String> getFailVisitedUrl(String seedName)
seedName - String

Copyright © 2018. All rights reserved.