Class Crawler
java.lang.Object
gov.nasa.pds.tools.validate.crawler.Crawler
- Direct Known Subclasses:
FileCrawler, URLCrawler
public abstract class Crawler extends Object
-
Field Summary
Fields
Modifier and Type Field Description
protected FileFilter
directoryFilter
A directory filter.
protected org.apache.commons.io.filefilter.IOFileFilter
fileFilter
A file filter.
protected ArrayList<Target>
ignoreList
-
Constructor Summary
-
Method Summary
Modifier and Type Method Description
void
addAllIgnoreItems(ArrayList<Target> ignoreList)
List<Target>
crawl(URL url)
List<Target>
crawl(URL url, boolean getDirectories)
abstract List<Target>
crawl(URL url, boolean getDirectories, org.apache.commons.io.filefilter.IOFileFilter fileFilter)
List<Target>
crawl(URL url, String[] extensions, boolean getDirectories, String nameToken)
List<Target>
crawl(URL url, org.apache.commons.io.filefilter.IOFileFilter fileFilter)
void
setFileFilter(List<String> fileFilters)
void
setFileFilter(org.apache.commons.io.filefilter.IOFileFilter fileFilter)
-
Field Details
-
fileFilter
protected org.apache.commons.io.filefilter.IOFileFilter fileFilter
A file filter.
-
directoryFilter
A directory filter. -
ignoreList
-
-
Constructor Details
-
Crawler
public Crawler() -
Crawler
public Crawler(org.apache.commons.io.filefilter.IOFileFilter fileFilter)
-
-
Method Details
-
addAllIgnoreItems
-
setFileFilter
-
setFileFilter
public void setFileFilter(org.apache.commons.io.filefilter.IOFileFilter fileFilter) -
crawl
- Throws:
IOException
-
crawl
public List<Target> crawl(URL url, org.apache.commons.io.filefilter.IOFileFilter fileFilter) throws IOException
- Throws:
IOException
-
crawl
- Throws:
IOException
-
crawl
public List<Target> crawl(URL url, String[] extensions, boolean getDirectories, String nameToken) throws IOException
- Throws:
IOException
-
crawl
public abstract List<Target> crawl(URL url, boolean getDirectories, org.apache.commons.io.filefilter.IOFileFilter fileFilter) throws IOException
- Throws:
IOException
-