Class Crawler
- java.lang.Object
-
- gov.nasa.pds.tools.validate.crawler.Crawler
-
- Direct Known Subclasses:
FileCrawler, URLCrawler
public abstract class Crawler extends Object
-
-
Field Summary
Fields
Modifier and Type | Field | Description
protected FileFilter
directoryFilter
A directory filter.
protected org.apache.commons.io.filefilter.IOFileFilter
fileFilter
A file filter.
protected ArrayList<Target>
ignoreList
-
Method Summary
All Methods | Instance Methods | Abstract Methods | Concrete Methods
Modifier and Type | Method | Description
void
addAllIgnoreItems(ArrayList<Target> ignoreList)
List<Target>
crawl(URL url)
List<Target>
crawl(URL url, boolean getDirectories)
abstract List<Target>
crawl(URL url, boolean getDirectories, org.apache.commons.io.filefilter.IOFileFilter fileFilter)
List<Target>
crawl(URL url, String[] extensions, boolean getDirectories, String nameToken)
List<Target>
crawl(URL url, org.apache.commons.io.filefilter.IOFileFilter fileFilter)
void
setFileFilter(List<String> fileFilters)
void
setFileFilter(org.apache.commons.io.filefilter.IOFileFilter fileFilter)
-
-
-
Field Detail
-
fileFilter
protected org.apache.commons.io.filefilter.IOFileFilter fileFilter
A file filter.
-
directoryFilter
protected FileFilter directoryFilter
A directory filter.
-
-
Method Detail
-
setFileFilter
public void setFileFilter(org.apache.commons.io.filefilter.IOFileFilter fileFilter)
-
crawl
public List<Target> crawl(URL url) throws IOException
- Throws:
IOException
-
crawl
public List<Target> crawl(URL url, org.apache.commons.io.filefilter.IOFileFilter fileFilter) throws IOException
- Throws:
IOException
-
crawl
public List<Target> crawl(URL url, boolean getDirectories) throws IOException
- Throws:
IOException
-
crawl
public List<Target> crawl(URL url, String[] extensions, boolean getDirectories, String nameToken) throws IOException
- Throws:
IOException
-
crawl
public abstract List<Target> crawl(URL url, boolean getDirectories, org.apache.commons.io.filefilter.IOFileFilter fileFilter) throws IOException
- Throws:
IOException
-
-