Skip navigation links
A B C D E F G H I K L M N O P Q R S T U V W Z 

A

ACCEPT_ALL - Static variable in interface de.l3s.icrawl.crawler.urls.UrlFilter
 
addDefaultProps(ImmutableMap.Builder<String, Object>) - Method in class de.l3s.icrawl.crawler.yarn.AppMaster
 
addDefaultProps(ImmutableMap.Builder<String, Object>) - Method in class de.l3s.icrawl.crawler.yarn.BaseAppMaster
 
addDefaultProps(ImmutableMap.Builder<String, Object>) - Method in class de.l3s.icrawl.crawler.yarn.EvaluationAppMaster
 
addLabel(NamedEntity.Label) - Method in class de.l3s.icrawl.domain.specification.NamedEntity
 
addLabel(String, Locale) - Method in class de.l3s.icrawl.domain.specification.NamedEntity
 
addListener(StoppingCriterion.StopListener) - Method in class de.l3s.icrawl.crawler.scheduling.StoppingCriterion
 
addParameters(ImmutableMap.Builder<String, String>) - Method in class de.l3s.icrawl.crawler.yarn.BaseClient
 
addParameters(ImmutableMap.Builder<String, String>) - Method in class de.l3s.icrawl.crawler.yarn.Client
 
addParameters(ImmutableMap.Builder<String, String>) - Method in class de.l3s.icrawl.crawler.yarn.EvaluationClient
 
addResources(ImmutableMap.Builder<String, LocalResource>) - Method in class de.l3s.icrawl.crawler.yarn.BaseClient
 
addResources(ImmutableMap.Builder<String, LocalResource>) - Method in class de.l3s.icrawl.crawler.yarn.Client
 
addResources(ImmutableMap.Builder<String, LocalResource>) - Method in class de.l3s.icrawl.crawler.yarn.EvaluationClient
 
afterDate(LocalDate, Period) - Static method in class de.l3s.icrawl.crawler.TimeSpecification
 
analyse(Snapshot, CrawlUrl) - Method in class de.l3s.icrawl.crawler.analysis.ResourceAnalyser
 
analyze(List<String>, Set<String>) - Method in class de.l3s.icrawl.contentanalysis.ContentAnalyser
 
AppMaster - Class in de.l3s.icrawl.crawler.yarn
 
AppMaster() - Constructor for class de.l3s.icrawl.crawler.yarn.AppMaster
 
ArchiveCrawler - Class in de.l3s.icrawl.crawler
 
ArchiveCrawler() - Constructor for class de.l3s.icrawl.crawler.ArchiveCrawler
 
ArchiveCrawler.CsvStorerConfig - Class in de.l3s.icrawl.crawler
 
ArchiveCrawler.StorerConfig - Interface in de.l3s.icrawl.crawler
 
ArchiveCrawler.ZipFileStorerConfig - Class in de.l3s.icrawl.crawler
 
ArchiveCrawlSpecification - Class in de.l3s.icrawl.crawler
 
ArchiveCrawlSpecification(String, List<String>, List<String>, TimeSpecification, Map<Locale, DocumentVector>, Map<Locale, Set<String>>, String, Locale, Map<Locale, Double>) - Constructor for class de.l3s.icrawl.crawler.ArchiveCrawlSpecification
 
ArchiveFetcher - Class in de.l3s.icrawl.crawler.io
 
ArchiveFetcher(Configuration, String, String, MetricRegistry, int) - Constructor for class de.l3s.icrawl.crawler.io.ArchiveFetcher
 
ArchiveRecordParser - Class in de.l3s.icrawl.snapshots
 
ArchiveRecordParser() - Constructor for class de.l3s.icrawl.snapshots.ArchiveRecordParser
 
asMap() - Method in class org.openimaj.text.nlp.language.LanguageDetector.WeightedLocale
 

B

BaseAppMaster - Class in de.l3s.icrawl.crawler.yarn
 
BaseAppMaster() - Constructor for class de.l3s.icrawl.crawler.yarn.BaseAppMaster
 
BaseClient - Class in de.l3s.icrawl.crawler.yarn
 
BaseClient() - Constructor for class de.l3s.icrawl.crawler.yarn.BaseClient
 
BaseFrontier - Class in de.l3s.icrawl.crawler.frontier
 
BaseFrontier(MetricRegistry) - Constructor for class de.l3s.icrawl.crawler.frontier.BaseFrontier
 
BaseSnapshotsLocator - Class in de.l3s.icrawl.snapshots
 
BaseSnapshotsLocator(URLKeyMaker, MetricRegistry) - Constructor for class de.l3s.icrawl.snapshots.BaseSnapshotsLocator
 
binaryHeader() - Method in interface org.openimaj.io.ReadableBinary
Header for binary input.
binaryHeader() - Method in class org.openimaj.io.wrappers.Readable2DArrayBinary
 
binaryHeader() - Method in class org.openimaj.io.wrappers.ReadableArrayBinary
 
binaryHeader() - Method in class org.openimaj.io.wrappers.Writeable2DArrayBinary
 
binaryHeader() - Method in class org.openimaj.io.wrappers.WriteableArrayBinary
 
binaryHeader() - Method in interface org.openimaj.io.WriteableBinary
Header for binary output.
binaryHeader() - Method in class org.openimaj.text.nlp.language.LanguageModel
 
buildDocumentVector(String, LanguageModel.KeywordMatcher) - Method in class de.l3s.icrawl.contentanalysis.LanguageModel
 
buildDocumentVector(Locale, String, LanguageModel.KeywordMatcher) - Method in class de.l3s.icrawl.contentanalysis.LanguageModels
 
buildLanguage(String) - Static method in class com.sharethis.textrank.LanguageModel
Factory method, loads libraries for StanfordCoreNLP based on the given language code.
buildMatcher(Iterable<String>, int) - Method in class de.l3s.icrawl.contentanalysis.LanguageModel
 
buildMatcher(Locale, Iterable<String>, int) - Method in class de.l3s.icrawl.contentanalysis.LanguageModels
 
buildNGram(Graph, Sentence, List<Integer>, double) - Static method in class com.sharethis.textrank.NGram
Factory method.
buildNode(Graph, String, NodeValue) - Static method in class com.sharethis.textrank.Node
Factory method.
ByteBufferBackedInputStream - Class in de.l3s.icrawl.util
 
ByteBufferBackedInputStream(ByteBuffer) - Constructor for class de.l3s.icrawl.util.ByteBufferBackedInputStream
 

C

calcStats(Graph) - Static method in class com.sharethis.textrank.NGram
Determine a statistical distribution for the n-gram subgraph.
call() - Method in class com.sharethis.textrank.TextRank
Run the TextRank algorithm on the given semi-structured text (e.g., results of parsed HTML from crawled web content) to build a graph of weighted key phrases.
canonicalize(URL) - Method in class de.l3s.icrawl.crawler.urls.UrlCanonicalizerNormalizer.StripParametersCanonicalizer
 
Category() - Constructor for class net.sourceforge.jwbf.core.contentRep.ParsedPage.Category
 
checkUsage(String[]) - Method in class de.l3s.icrawl.crawler.yarn.BaseClient
 
checkUsage(String[]) - Method in class de.l3s.icrawl.crawler.yarn.Client
 
checkUsage(String[]) - Method in class de.l3s.icrawl.crawler.yarn.EvaluationClient
 
classify(String) - Method in class org.openimaj.text.nlp.language.LanguageDetector
Classify the language using a naive Bayes model.
cleanup() - Method in class de.l3s.icrawl.crawler.yarn.BaseClient
 
cleanup() - Method in class de.l3s.icrawl.crawler.yarn.Client
 
cleanup() - Method in class de.l3s.icrawl.crawler.yarn.EvaluationClient
 
Client - Class in de.l3s.icrawl.crawler.yarn
 
Client() - Constructor for class de.l3s.icrawl.crawler.yarn.Client
 
close() - Method in class de.l3s.icrawl.crawler.frontier.BaseFrontier
 
close() - Method in class de.l3s.icrawl.crawler.frontier.FileBasedFrontier
 
close() - Method in class de.l3s.icrawl.crawler.io.ArchiveFetcher
 
close() - Method in class de.l3s.icrawl.crawler.io.CsvStorer
 
close() - Method in class de.l3s.icrawl.crawler.io.LoggingStorer
 
close() - Method in class de.l3s.icrawl.crawler.io.ZipFileStorer
 
close() - Method in class de.l3s.icrawl.snapshots.HBaseSnapshotsLocator
 
collectNGrams(LanguageModel, List<Sentence>, double) - Static method in class com.sharethis.textrank.NGram
Report the n-grams marked in each sentence.
com.sharethis.textrank - package com.sharethis.textrank
 
compare(SnaphotLocation, SnaphotLocation) - Method in class de.l3s.icrawl.crawler.TimeSpecification
 
compareTo(MetricVector) - Method in class com.sharethis.textrank.MetricVector
Compare method for sort ordering.
compareTo(NGram) - Method in class com.sharethis.textrank.NGram
Compare method for sort ordering.
compareTo(Node) - Method in class com.sharethis.textrank.Node
Compare method for sort ordering.
CompositeStoppingCriterion - Class in de.l3s.icrawl.crawler.scheduling
 
CompositeStoppingCriterion(List<StoppingCriterion>) - Constructor for class de.l3s.icrawl.crawler.scheduling.CompositeStoppingCriterion
 
CompositeStoppingCriterion(StoppingCriterion...) - Constructor for class de.l3s.icrawl.crawler.scheduling.CompositeStoppingCriterion
 
conf - Variable in class de.l3s.icrawl.crawler.yarn.BaseAppMaster
 
confidence - Variable in class org.openimaj.text.nlp.language.LanguageDetector.WeightedLocale
Naive Bayesian probability.
configure(String[]) - Method in class de.l3s.icrawl.crawler.yarn.BaseClient
 
configure(String[]) - Method in class de.l3s.icrawl.crawler.yarn.Client
 
configure(String[]) - Method in class de.l3s.icrawl.crawler.yarn.EvaluationClient
 
connect(Node) - Method in class com.sharethis.textrank.Node
Connect two nodes with a bi-directional arc in the graph.
containingElement(Node) - Static method in class de.l3s.icrawl.util.WebPageUtils
 
contains(ZonedDateTime) - Method in class de.l3s.icrawl.crawler.TimeSpecification
 
ContentAnalyser - Class in de.l3s.icrawl.contentanalysis
 
ContentAnalyser(LanguageDetector, LabelerFactory) - Constructor for class de.l3s.icrawl.contentanalysis.ContentAnalyser
 
ContentAnalyser.Counts - Class in de.l3s.icrawl.contentanalysis
 
Context - Class in com.sharethis.textrank
Track the context within a sentence for a selected n-gram.
Context(Sentence, int) - Constructor for class com.sharethis.textrank.Context
Constructor.
contexts - Variable in class com.sharethis.textrank.NGram
 
CoreNlpLanguageModel - Class in com.sharethis.textrank
Implementation of English-specific tools for natural language processing.
CoreNlpLanguageModel(WordsToSentencesAnnotator, TokenizerAnnotator, POSTaggerAnnotator, SnowballProgram) - Constructor for class com.sharethis.textrank.CoreNlpLanguageModel
 
cosineSimilarity(DocumentVector) - Method in class de.l3s.icrawl.contentanalysis.DocumentVector
 
count_rank - Variable in class com.sharethis.textrank.MetricVector
 
crawl(ApplicationContext, Crawler) - Method in class de.l3s.icrawl.crawler.yarn.AppMaster
 
crawl(ApplicationContext, Crawler) - Method in class de.l3s.icrawl.crawler.yarn.BaseAppMaster
 
crawl(ApplicationContext, Crawler) - Method in class de.l3s.icrawl.crawler.yarn.EvaluationAppMaster
 
crawlContinuously(ArchiveCrawlSpecification, StoppingCriterion, ResourceAnalyser.WeightingMethod, double, int) - Method in class de.l3s.icrawl.crawler.Crawler
 
CrawledResource - Class in de.l3s.icrawl.crawler
 
CrawledResource(CrawlUrl, Snapshot, double, ZonedDateTime) - Constructor for class de.l3s.icrawl.crawler.CrawledResource
 
CrawledResource(CrawlUrl, Snapshot, double, ZonedDateTime, Duration, double, double) - Constructor for class de.l3s.icrawl.crawler.CrawledResource
 
Crawler - Class in de.l3s.icrawl.crawler
 
Crawler(Configuration, String, String, ResourceAnalyserFactory, ResultStorer.Factory, MetricRegistry, int) - Constructor for class de.l3s.icrawl.crawler.Crawler
 
CrawlerThread - Class in de.l3s.icrawl.crawler
 
CrawlerThread(Frontier, ArchiveFetcher, ResultStorer, ResourceAnalyser, MetricRegistry, ArchiveCrawlSpecification, CountDownLatch, StoppingCriterion, double) - Constructor for class de.l3s.icrawl.crawler.CrawlerThread
 
CrawlSpecCreator - Class in de.l3s.icrawl.crawler.tools
 
CrawlSpecCreator() - Constructor for class de.l3s.icrawl.crawler.tools.CrawlSpecCreator
 
CrawlUrl - Class in de.l3s.icrawl.crawler
 
CrawlUrl(String, String, float, String, ZonedDateTime) - Constructor for class de.l3s.icrawl.crawler.CrawlUrl
 
CrawlUrl.Path - Enum in de.l3s.icrawl.crawler
 
createEmpty(int) - Method in class org.openimaj.io.wrappers.ReadableArrayBinary
 
CsvStorer - Class in de.l3s.icrawl.crawler.io
 
CsvStorer(Configuration, Path) - Constructor for class de.l3s.icrawl.crawler.io.CsvStorer
 
CsvStorerConfig() - Constructor for class de.l3s.icrawl.crawler.ArchiveCrawler.CsvStorerConfig
 
CUTOFF_DATE - Static variable in class de.l3s.icrawl.util.DateUtils
 

D

dateMetaKey(String) - Static method in class de.l3s.icrawl.util.DateUtils
 
DateUtils - Class in de.l3s.icrawl.util
 
de.l3s.icrawl.contentanalysis - package de.l3s.icrawl.contentanalysis
Analysis of crawled documents
de.l3s.icrawl.crawler - package de.l3s.icrawl.crawler
 
de.l3s.icrawl.crawler.analysis - package de.l3s.icrawl.crawler.analysis
Analysis of the content of crawled Web pages.
de.l3s.icrawl.crawler.frontier - package de.l3s.icrawl.crawler.frontier
Crawler queue / frontier management
de.l3s.icrawl.crawler.io - package de.l3s.icrawl.crawler.io
Fetching and storing of archive snapshots
de.l3s.icrawl.crawler.scheduling - package de.l3s.icrawl.crawler.scheduling
Stopping of running crawls
de.l3s.icrawl.crawler.tools - package de.l3s.icrawl.crawler.tools
Helper scripts
de.l3s.icrawl.crawler.ui - package de.l3s.icrawl.crawler.ui
HTTP interface to monitor a running crawl.
de.l3s.icrawl.crawler.urls - package de.l3s.icrawl.crawler.urls
Normalization and filtering of discovered URLs
de.l3s.icrawl.crawler.yarn - package de.l3s.icrawl.crawler.yarn
Runner classes to execute the crawler as a YARN job.
de.l3s.icrawl.domain.specification - package de.l3s.icrawl.domain.specification
 
de.l3s.icrawl.snapshots - package de.l3s.icrawl.snapshots
 
de.l3s.icrawl.util - package de.l3s.icrawl.util
 
defaultFactory() - Static method in class de.l3s.icrawl.contentanalysis.LabelerFactory
 
DirectoryPrefixResolver - Class in de.l3s.icrawl.snapshots
 
DirectoryPrefixResolver(String) - Constructor for class de.l3s.icrawl.snapshots.DirectoryPrefixResolver
 
disable(int) - Method in class de.l3s.icrawl.crawler.frontier.WeightedRandomSelector
 
disconnect(Node) - Method in class com.sharethis.textrank.Node
Disconnect two nodes removing their bi-directional arc in the graph.
dist_stats - Variable in class com.sharethis.textrank.Graph
Public members.
DocumentVector - Class in de.l3s.icrawl.contentanalysis
A sparse representation of a term frequency document vector
DocumentVector(Map<String, Double>) - Constructor for class de.l3s.icrawl.contentanalysis.DocumentVector
 
DocumentVector(Collection<String>) - Constructor for class de.l3s.icrawl.contentanalysis.DocumentVector
 
DocumentVectorSimilarity - Class in de.l3s.icrawl.contentanalysis
Class to compute the distance of a document to a document collection.
DocumentVectorSimilarity(Map<String, Locale>, Set<String>, Set<NamedEntity>, int, boolean, Locale, LanguageModels) - Constructor for class de.l3s.icrawl.contentanalysis.DocumentVectorSimilarity
Create a DocumentVectorSimilarity object that is serializable and stores a reference to the input's document collection.
DocumentVectorSimilarity(Map<Locale, DocumentVector>, Map<Locale, LanguageModel.KeywordMatcher>, Locale, Map<Locale, Double>) - Constructor for class de.l3s.icrawl.contentanalysis.DocumentVectorSimilarity
 
dotProduct(DocumentVector) - Method in class de.l3s.icrawl.contentanalysis.DocumentVector
 

E

edges - Variable in class com.sharethis.textrank.Node
Public members.
elapsed_time - Variable in class com.sharethis.textrank.TextRank
 
EMPTY - Static variable in class de.l3s.icrawl.crawler.analysis.ResourceAnalyser.Result
 
emptyQueue - Variable in class de.l3s.icrawl.crawler.frontier.BaseFrontier
 
enable(int) - Method in class de.l3s.icrawl.crawler.frontier.WeightedRandomSelector
 
encode(String) - Static method in class io.mola.galimatias.FormURLEncodedParser
encode(String, Charset) - Static method in class io.mola.galimatias.FormURLEncodedParser
encode(List<NameValue>) - Static method in class io.mola.galimatias.FormURLEncodedParser
Implements the application/x-www-form-urlencoded serializer.
encode(List<NameValue>, Charset) - Static method in class io.mola.galimatias.FormURLEncodedParser
Implements the application/x-www-form-urlencoded serializer.
englishModel() - Static method in class com.sharethis.textrank.CoreNlpLanguageModel
 
environment() - Method in class de.l3s.icrawl.crawler.ui.InfoController
 
equals(Object) - Method in class com.sharethis.textrank.MetricVector
 
equals(Object) - Method in class com.sharethis.textrank.NGram
 
equals(Object) - Method in class com.sharethis.textrank.Node
 
equals(Object) - Method in class de.l3s.icrawl.contentanalysis.DocumentVector
 
equals(Object) - Method in class de.l3s.icrawl.crawler.ArchiveCrawlSpecification
 
equals(Object) - Method in class de.l3s.icrawl.crawler.CrawlUrl
 
equals(Object) - Method in class de.l3s.icrawl.crawler.TimeSpecification
 
equals(Object) - Method in class de.l3s.icrawl.domain.specification.NamedEntity
 
equals(Object) - Method in class de.l3s.icrawl.domain.specification.NamedEntity.Label
 
equals(Object) - Method in class de.l3s.icrawl.snapshots.SnaphotLocation
 
equals(Object) - Method in class io.mola.galimatias.NameValue
 
equals(Object) - Method in class io.mola.galimatias.URLSearchParameters
 
equals(Object) - Method in class org.openimaj.text.nlp.language.LanguageModel
 
EvaluationAppMaster - Class in de.l3s.icrawl.crawler.yarn
 
EvaluationAppMaster() - Constructor for class de.l3s.icrawl.crawler.yarn.EvaluationAppMaster
 
EvaluationClient - Class in de.l3s.icrawl.crawler.yarn
 
EvaluationClient() - Constructor for class de.l3s.icrawl.crawler.yarn.EvaluationClient
 
exists() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage.Link
 
extract(String, Collection<String>, LocalDate, LocalDate, Period, Period, String, File) - Method in class de.l3s.icrawl.crawler.tools.CrawlSpecCreator
 
extractDate(String) - Static method in class de.l3s.icrawl.util.DateUtils
 
extractDateFromUrl(String) - Static method in class de.l3s.icrawl.util.DateUtils
 
extractEntities(Labeler, String) - Method in class de.l3s.icrawl.contentanalysis.ContentAnalyser
 
extractEntities(String) - Method in class de.l3s.icrawl.contentanalysis.Labeler
 
ExtractionException(String, Throwable) - Constructor for exception de.l3s.icrawl.contentanalysis.WebPageDateExtractor.ExtractionException
 
ExtractionException(String) - Constructor for exception de.l3s.icrawl.contentanalysis.WebPageDateExtractor.ExtractionException
 
ExtractionException(Throwable) - Constructor for exception de.l3s.icrawl.contentanalysis.WebPageDateExtractor.ExtractionException
 
extractModifiedDate(Document) - Static method in class de.l3s.icrawl.contentanalysis.WebPageDateExtractor
Extract the likely modification date from a parsed document.
extractText(Element) - Static method in class de.l3s.icrawl.util.TextExtractor
 
extractText(Document) - Static method in class de.l3s.icrawl.util.TextExtractor
 
extractTextFromJavascript(Document) - Static method in class de.l3s.icrawl.util.WebPageUtils
 

F

Factory(MetricRegistry, float, float) - Constructor for class de.l3s.icrawl.crawler.analysis.ResourceAnalyser.Factory
 
FileBasedFrontier - Class in de.l3s.icrawl.crawler.frontier
 
FileBasedFrontier(File, MetricRegistry, int, boolean) - Constructor for class de.l3s.icrawl.crawler.frontier.FileBasedFrontier
 
findBest(Iterable<SnaphotLocation>) - Method in class de.l3s.icrawl.crawler.TimeSpecification
 
findBest(Iterable<SnaphotLocation>, int) - Method in class de.l3s.icrawl.crawler.TimeSpecification
 
findInternal(String) - Method in class de.l3s.icrawl.snapshots.BaseSnapshotsLocator
 
findInternal(String) - Method in class de.l3s.icrawl.snapshots.HBaseSnapshotsLocator
 
findLocation(String, ZonedDateTime) - Method in class de.l3s.icrawl.snapshots.BaseSnapshotsLocator
 
findLocation(String, ZonedDateTime) - Method in interface de.l3s.icrawl.snapshots.SnapshotsLocator
 
findLocations(String) - Method in class de.l3s.icrawl.snapshots.BaseSnapshotsLocator
 
findLocations(String) - Method in interface de.l3s.icrawl.snapshots.SnapshotsLocator
 
findOneInternal(String, ZonedDateTime) - Method in class de.l3s.icrawl.snapshots.BaseSnapshotsLocator
 
findOneInternal(String, ZonedDateTime) - Method in class de.l3s.icrawl.snapshots.HBaseSnapshotsLocator
 
findParagraphParent(Element, int) - Static method in class de.l3s.icrawl.util.WebPageUtils
 
findParagraphParent(Element) - Static method in class de.l3s.icrawl.util.WebPageUtils
 
findParagraphParent(Node, int) - Static method in class de.l3s.icrawl.util.WebPageUtils
 
FormURLEncodedParser - Class in io.mola.galimatias
Parses query strings with application/x-www-form-urlencoded rules.
from - Variable in class net.sourceforge.jwbf.core.contentRep.ParsedPage.Redirect
 
fromMap(Map<String, Object>) - Static method in class org.openimaj.text.nlp.language.LanguageDetector.WeightedLocale
 
fromSeed(String, float) - Static method in class de.l3s.icrawl.crawler.CrawlUrl
 
fromVectors(Map<Locale, DocumentVector>, Map<Locale, Set<String>>, Locale, LanguageModels, Map<Locale, Double>) - Static method in class de.l3s.icrawl.contentanalysis.DocumentVectorSimilarity
 
Frontier - Interface in de.l3s.icrawl.crawler.frontier
 

G

generate(Locale, int, String) - Method in class org.openimaj.text.nlp.language.MarkovChainLanguageModel
Generate a string of the desired length using this model.
germanModel() - Static method in class com.sharethis.textrank.CoreNlpLanguageModel
 
get(LanguageDetector.WeightedLocale) - Method in class de.l3s.icrawl.contentanalysis.LabelerFactory
 
get(ArchiveCrawlSpecification, ResourceAnalyser.WeightingMethod) - Method in class de.l3s.icrawl.crawler.analysis.ResourceAnalyser.Factory
 
get(ArchiveCrawlSpecification, ResourceAnalyser.WeightingMethod) - Method in interface de.l3s.icrawl.crawler.analysis.ResourceAnalyserFactory
 
get(CrawlUrl, TimeSpecification) - Method in class de.l3s.icrawl.crawler.io.ArchiveFetcher
 
get(String) - Method in interface de.l3s.icrawl.crawler.io.ResultStorer.Factory
 
get(String) - Method in class io.mola.galimatias.URLSearchParameters
 
getAll(String) - Method in class io.mola.galimatias.URLSearchParameters
 
getAnchor() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage.Section
 
getAppMasterClass() - Method in class de.l3s.icrawl.crawler.yarn.BaseClient
 
getAppMasterClass() - Method in class de.l3s.icrawl.crawler.yarn.Client
 
getAppMasterClass() - Method in class de.l3s.icrawl.crawler.yarn.EvaluationClient
 
getAutonym() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage.LangLink
 
getByteOffset() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage.Section
 
getCategories() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage
 
getCharset(byte[], int, HttpHeaders) - Method in class de.l3s.icrawl.snapshots.OnlyHtmlCharsetDetector
 
getCollocation() - Method in class com.sharethis.textrank.NodeValue
Create a collocation out of the text for lookup in WordNet.
getContent() - Method in class de.l3s.icrawl.crawler.Resource
 
getContent() - Method in class de.l3s.icrawl.snapshots.Snapshot
 
getCorrectionFactors() - Method in class de.l3s.icrawl.contentanalysis.DocumentVectorSimilarity
 
getCorrectionFactors() - Method in class de.l3s.icrawl.crawler.ArchiveCrawlSpecification
 
getCount() - Method in class com.sharethis.textrank.NGram
Determine the count, i.e., how often this n-gram recurs within the text.
getCrawlPriority() - Method in class de.l3s.icrawl.crawler.CrawledResource
 
getCrawlTime() - Method in class de.l3s.icrawl.snapshots.SnaphotLocation
 
getCrawlTime() - Method in class de.l3s.icrawl.snapshots.Snapshot
 
getCurrentSpec() - Method in class de.l3s.icrawl.crawler.Crawler
 
getDate() - Method in class de.l3s.icrawl.contentanalysis.WebPageDateExtractor.WebPageDate
 
getDateSource() - Method in class de.l3s.icrawl.contentanalysis.WebPageDateExtractor.WebPageDate
 
getDefaultLanguage() - Method in class de.l3s.icrawl.contentanalysis.LanguageModels
 
getDefaultLanguage() - Method in class de.l3s.icrawl.crawler.ArchiveCrawlSpecification
 
getDescription() - Method in class com.sharethis.textrank.KeyWord
Create a description text for this value.
getDescription() - Method in class com.sharethis.textrank.NGram
Create a description text for this value.
getDescription() - Method in class com.sharethis.textrank.NodeValue
Create a description text for this value.
getDescription() - Method in class de.l3s.icrawl.crawler.ArchiveCrawlSpecification
 
getDetectedKeywords() - Method in class de.l3s.icrawl.contentanalysis.ContentAnalyser.Counts
 
getDisplayTitle() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage
 
getDocumentLength() - Method in class de.l3s.icrawl.contentanalysis.ContentAnalyser.Counts
 
getEnd() - Method in class de.l3s.icrawl.crawler.TimeSpecification
 
getEntities() - Method in class de.l3s.icrawl.contentanalysis.ContentAnalyser.Counts
 
getExternalLinks() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage
 
getFrom() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage.Redirect
 
getFromtitle() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage.Section
 
getGraph() - Method in class com.sharethis.textrank.TextRank
Accessor for the graph.
getHeaders() - Method in class de.l3s.icrawl.crawler.Resource
 
getHeaders() - Method in class de.l3s.icrawl.snapshots.Snapshot
 
getId() - Method in class com.sharethis.textrank.Node
Create a unique identifier for this node, returned as a hex string.
getImages() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage
 
getIndex() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage.Section
 
getInstance() - Static method in class io.mola.galimatias.FormURLEncodedParser
Deprecated.
getInterWikiLinks() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage
 
getJarPath() - Method in class de.l3s.icrawl.crawler.yarn.BaseClient
 
getJarPath() - Method in class de.l3s.icrawl.crawler.yarn.Client
 
getJarPath() - Method in class de.l3s.icrawl.crawler.yarn.EvaluationClient
 
getKeywords() - Method in class de.l3s.icrawl.contentanalysis.ContentAnalyser.Counts
 
getKeywords() - Method in class de.l3s.icrawl.crawler.ArchiveCrawlSpecification
 
getLabels() - Method in class de.l3s.icrawl.domain.specification.NamedEntity
 
getLang() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage.LangLink
 
getLangCode() - Method in enum de.l3s.icrawl.contentanalysis.TextRankWrapper.LANG_CODE
 
getLangLinks() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage
 
getLangName() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage.LangLink
 
getLanguage() - Method in class de.l3s.icrawl.contentanalysis.ContentAnalyser.Counts
 
getLanguage() - Method in class de.l3s.icrawl.domain.specification.NamedEntity.Label
Get the language of the label.
getLanguageModel() - Method in class org.openimaj.text.nlp.language.LanguageDetector
 
getLength() - Method in class de.l3s.icrawl.snapshots.SnaphotLocation
 
getLevel() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage.Section
 
getLine() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage.Section
 
getLinks() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage
 
getLocale() - Method in class org.openimaj.text.nlp.language.LanguageDetector.WeightedLocale
 
getMatchers() - Method in class de.l3s.icrawl.contentanalysis.DocumentVectorSimilarity
 
getMaxRelevance() - Method in class de.l3s.icrawl.crawler.CrawledResource
 
getMaxUrls() - Method in class de.l3s.icrawl.crawler.yarn.BaseAppMaster
 
getMimeType() - Method in class de.l3s.icrawl.snapshots.SnaphotLocation
 
getMimeType() - Method in class de.l3s.icrawl.snapshots.Snapshot
 
getMinRelevance() - Method in class de.l3s.icrawl.crawler.CrawledResource
 
getModifiedDate(String, Document, Long, Mapper<?, ?, ?, ?>.Context) - Static method in class de.l3s.icrawl.contentanalysis.WebPageDateExtractor
 
getModifiedDate() - Method in class de.l3s.icrawl.crawler.analysis.ResourceAnalyser.Result
 
getModifiedDate() - Method in class de.l3s.icrawl.crawler.CrawledResource
 
getName() - Method in class de.l3s.icrawl.crawler.ArchiveCrawlSpecification
 
getName() - Method in enum de.l3s.icrawl.crawler.CrawlUrl.Path
 
getName() - Method in class de.l3s.icrawl.domain.specification.NamedEntity.Label
Get the name of the label.
getName() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage.Category
 
getName() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage.InterWikiLink
 
getName() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage.Link
 
getNamespace() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage.Link
 
getNextMessage() - Method in class net.sourceforge.jwbf.mediawiki.actions.misc.ParsePage
 
getNodeKey(String, String) - Method in class com.sharethis.textrank.CoreNlpLanguageModel
 
getNodeKey(String, String) - Method in class com.sharethis.textrank.LanguageModel
Prepare a stable key for a graph node (stemmed, lemmatized) from a token.
getNumber() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage.Section
 
getOriginalUrl() - Method in class de.l3s.icrawl.snapshots.Snapshot
 
getOutlinks() - Method in class de.l3s.icrawl.crawler.analysis.ResourceAnalyser.Result
 
getPageId() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage
 
getPageName() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage.LangLink
 
getPath() - Method in class de.l3s.icrawl.crawler.CrawledResource
 
getPath() - Method in class de.l3s.icrawl.crawler.CrawlUrl
 
getPrefix() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage.InterWikiLink
 
getPriority() - Method in class de.l3s.icrawl.crawler.CrawlUrl
 
getProfiles() - Method in class de.l3s.icrawl.crawler.yarn.AppMaster
 
getProfiles() - Method in class de.l3s.icrawl.crawler.yarn.BaseAppMaster
 
getProfiles() - Method in class de.l3s.icrawl.crawler.yarn.EvaluationAppMaster
 
getProgress() - Method in class de.l3s.icrawl.crawler.scheduling.CompositeStoppingCriterion
 
getProgress() - Method in class de.l3s.icrawl.crawler.scheduling.NumberOfUrlsStoppingCriterion
 
getProgress() - Method in class de.l3s.icrawl.crawler.scheduling.QueueEmptyCriterion
 
getProgress() - Method in class de.l3s.icrawl.crawler.scheduling.StoppingCriterion
 
getProperties() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage
 
getRankThreshold() - Method in class com.sharethis.textrank.Graph
Calculate a threshold for the ranked results.
getRedirects() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage
 
getReferenceDocuments() - Method in class de.l3s.icrawl.crawler.ArchiveCrawlSpecification
 
getReferenceTime() - Method in class de.l3s.icrawl.crawler.ArchiveCrawlSpecification
 
getReferenceVectors() - Method in class de.l3s.icrawl.contentanalysis.DocumentVectorSimilarity
 
getReferenceVectors() - Method in class de.l3s.icrawl.crawler.ArchiveCrawlSpecification
 
getRefererCrawlTime() - Method in class de.l3s.icrawl.crawler.CrawlUrl
 
getReferrer() - Method in class de.l3s.icrawl.crawler.CrawlUrl
 
getRelevance() - Method in class de.l3s.icrawl.crawler.analysis.ResourceAnalyser.Result
 
getRelevance() - Method in class de.l3s.icrawl.crawler.CrawledResource
 
getRelevance(ZonedDateTime) - Method in class de.l3s.icrawl.crawler.TimeSpecification
 
getRelevanceExp(ZonedDateTime) - Method in class de.l3s.icrawl.crawler.TimeSpecification
 
getResource() - Method in class de.l3s.icrawl.crawler.CrawledResource
 
getResource(Path, Configuration, LocalResourceType) - Static method in class de.l3s.icrawl.crawler.yarn.BaseClient
 
getResult() - Method in class net.sourceforge.jwbf.mediawiki.actions.misc.ParsePage
 
getRevId() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage
 
getSections() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage
 
getSeedUrls() - Method in class de.l3s.icrawl.crawler.ArchiveCrawlSpecification
 
getServerPort() - Method in class de.l3s.icrawl.crawler.ArchiveCrawler
 
getSignature() - Method in class de.l3s.icrawl.snapshots.SnaphotLocation
 
getSimilarity(Locale, String) - Method in class de.l3s.icrawl.contentanalysis.DocumentVectorSimilarity
 
getSimilarity(Locale, String, DocumentVector, LanguageModel.KeywordMatcher) - Method in class de.l3s.icrawl.contentanalysis.LanguageModels
Calculate the cosine similarity of the document to the specification.
getSnapshotsDuration() - Method in class de.l3s.icrawl.crawler.CrawledResource
 
getSortkey() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage.Category
 
getStart() - Method in class de.l3s.icrawl.crawler.TimeSpecification
 
getStatus() - Method in class de.l3s.icrawl.snapshots.Snapshot
 
getTemplates() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage
 
getText() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage
 
getTitle() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage
 
getTo() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage.Redirect
 
getTocLevel() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage.Section
 
getToFragment() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage.Redirect
 
getType() - Method in class de.l3s.icrawl.domain.specification.NamedEntity
 
getUrl() - Method in class de.l3s.icrawl.crawler.CrawledResource
 
getUrl() - Method in class de.l3s.icrawl.crawler.CrawlUrl
 
getUrl() - Method in class de.l3s.icrawl.crawler.Resource
 
getUrl() - Method in class de.l3s.icrawl.snapshots.SnaphotLocation
 
getUrl() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage.InterWikiLink
 
getUrl() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage.LangLink
 
getValue() - Method in class de.l3s.icrawl.crawler.scheduling.StoppingCriterion
 
getWarcFile() - Method in class de.l3s.icrawl.snapshots.SnaphotLocation
 
getWarcFileOffset() - Method in class de.l3s.icrawl.snapshots.SnaphotLocation
 
Graph - Class in com.sharethis.textrank
An abstraction for handling the graph as a data object.
Graph() - Constructor for class com.sharethis.textrank.Graph
 
graph - Variable in class com.sharethis.textrank.TextRank
 

H

has(String) - Method in class io.mola.galimatias.URLSearchParameters
 
hashCode() - Method in class com.sharethis.textrank.MetricVector
 
hashCode() - Method in class com.sharethis.textrank.NGram
 
hashCode() - Method in class com.sharethis.textrank.Node
 
hashCode() - Method in class de.l3s.icrawl.contentanalysis.DocumentVector
 
hashCode() - Method in class de.l3s.icrawl.crawler.ArchiveCrawlSpecification
 
hashCode() - Method in class de.l3s.icrawl.crawler.CrawlUrl
 
hashCode() - Method in class de.l3s.icrawl.crawler.TimeSpecification
 
hashCode() - Method in class de.l3s.icrawl.domain.specification.NamedEntity
 
hashCode() - Method in class de.l3s.icrawl.domain.specification.NamedEntity.Label
 
hashCode() - Method in class de.l3s.icrawl.snapshots.SnaphotLocation
 
hashCode() - Method in class io.mola.galimatias.NameValue
 
hashCode() - Method in class io.mola.galimatias.URLSearchParameters
 
hasHtmlContent(String) - Static method in class de.l3s.icrawl.util.WebPageUtils
 
HBaseSnapshotsLocator - Class in de.l3s.icrawl.snapshots
 
HBaseSnapshotsLocator(Configuration, MetricRegistry) - Constructor for class de.l3s.icrawl.snapshots.HBaseSnapshotsLocator
 
HBaseSnapshotsLocator(Configuration, URLKeyMaker, MetricRegistry) - Constructor for class de.l3s.icrawl.snapshots.HBaseSnapshotsLocator
 
HdfsSnapshotReader - Class in de.l3s.icrawl.snapshots
 
HdfsSnapshotReader(Configuration, MetricRegistry) - Constructor for class de.l3s.icrawl.snapshots.HdfsSnapshotReader
 
HtmlParseException - Exception in de.l3s.icrawl.util
 
HtmlParseException(String, Throwable) - Constructor for exception de.l3s.icrawl.util.HtmlParseException
 

I

IDF_DICTIONARY_DE - Static variable in class de.l3s.icrawl.crawler.ArchiveCrawler
 
INCLUSIVE_COEFF - Static variable in class com.sharethis.textrank.Graph
Public definitions.
incoming - Variable in class de.l3s.icrawl.crawler.frontier.BaseFrontier
 
InfoController - Class in de.l3s.icrawl.crawler.ui
 
InfoController() - Constructor for class de.l3s.icrawl.crawler.ui.InfoController
 
InMemoryFrontier - Class in de.l3s.icrawl.crawler.frontier
 
InMemoryFrontier(MetricRegistry) - Constructor for class de.l3s.icrawl.crawler.frontier.InMemoryFrontier
 
interval(LocalDate, LocalDate, Period) - Static method in class de.l3s.icrawl.crawler.TimeSpecification
 
interval(LocalDate, LocalDate, Period, Period) - Static method in class de.l3s.icrawl.crawler.TimeSpecification
 
InterWikiLink() - Constructor for class net.sourceforge.jwbf.core.contentRep.ParsedPage.InterWikiLink
 
io.mola.galimatias - package io.mola.galimatias
 
IOUtils - Class in org.openimaj.io
Methods for reading Readable objects and writing Writeable objects.
IOUtils() - Constructor for class org.openimaj.io.IOUtils
 
isAdjective(String) - Method in class com.sharethis.textrank.CoreNlpLanguageModel
 
isAdjective(String) - Method in class com.sharethis.textrank.LanguageModel
Determine whether the given PoS tag is an adjective.
isHidden() - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage.Category
 
isNoun(String) - Method in class com.sharethis.textrank.CoreNlpLanguageModel
 
isNoun(String) - Method in class com.sharethis.textrank.LanguageModel
Determine whether the given PoS tag is a noun.
isRelevant(String) - Method in class com.sharethis.textrank.LanguageModel
Determine whether the given PoS tag is relevant to add to the graph.
isTimeSensitive() - Method in enum de.l3s.icrawl.crawler.analysis.ResourceAnalyser.WeightingMethod
 
isValidDate(ZonedDateTime) - Static method in class de.l3s.icrawl.util.DateUtils
 
iterateGraph(int) - Method in class com.sharethis.textrank.Graph
Iterate through the graph, calculating rank.
iterator() - Method in class io.mola.galimatias.URLSearchParameters
 

K

key - Variable in class com.sharethis.textrank.Node
 
KeyWord - Class in com.sharethis.textrank
Implements a node value in a TextRank graph denoting a noun or adjective.
KeyWord(String, String) - Constructor for class com.sharethis.textrank.KeyWord
Constructor.
KEYWORD_REDUCTION_FACTOR - Static variable in class com.sharethis.textrank.Graph
 

L

Label(String, Locale) - Constructor for class de.l3s.icrawl.domain.specification.NamedEntity.Label
Create a new label with name and language
Labeler - Class in de.l3s.icrawl.contentanalysis
 
Labeler(CRFClassifier<CoreMap>, Locale, String, String, String) - Constructor for class de.l3s.icrawl.contentanalysis.Labeler
 
LabelerFactory - Class in de.l3s.icrawl.contentanalysis
 
LabelerFactory(Map<String, Labeler>, String, Function<String, Labeler>) - Constructor for class de.l3s.icrawl.contentanalysis.LabelerFactory
 
lang - Variable in class com.sharethis.textrank.TextRank
Protected members.
LangLink() - Constructor for class net.sourceforge.jwbf.core.contentRep.ParsedPage.LangLink
 
language - Variable in class org.openimaj.text.nlp.language.LanguageDetector.WeightedLocale
Estimated language
LANGUAGE_MODEL_BINARY - Static variable in class org.openimaj.text.nlp.language.LanguageDetector
Default location of the compressed binary version of the language model.
LanguageDetector - Class in org.openimaj.text.nlp.language
Short text language detection ported from langid: https://github.com/saffsd/langid.py
LanguageDetector() - Constructor for class org.openimaj.text.nlp.language.LanguageDetector
LanguageDetector.WeightedLocale - Class in org.openimaj.text.nlp.language
A language with an associated confidence
LanguageModel - Class in com.sharethis.textrank
Facade for handling language-specific tools in natural language processing.
LanguageModel() - Constructor for class com.sharethis.textrank.LanguageModel
 
LanguageModel - Class in de.l3s.icrawl.contentanalysis
 
LanguageModel(Analyzer, Map<String, Double>) - Constructor for class de.l3s.icrawl.contentanalysis.LanguageModel
 
LanguageModel - Class in org.openimaj.text.nlp.language
The data used by LanguageDetector
LanguageModel() - Constructor for class org.openimaj.text.nlp.language.LanguageModel
Does nothing.
LanguageModel(Map<String, Object>) - Constructor for class org.openimaj.text.nlp.language.LanguageModel
 
LanguageModels - Class in de.l3s.icrawl.contentanalysis
 
LanguageModels(Locale, Map<String, Double>, Locale) - Constructor for class de.l3s.icrawl.contentanalysis.LanguageModels
 
LanguageModels(Locale, Map<Locale, LanguageModel>) - Constructor for class de.l3s.icrawl.contentanalysis.LanguageModels
 
length - Variable in class com.sharethis.textrank.NGram
 
liberalParseDate(String) - Static method in class de.l3s.icrawl.util.DateUtils
Try very hard to parse the parameter as a date.
Link() - Constructor for class net.sourceforge.jwbf.core.contentRep.ParsedPage.Link
 
link_rank - Variable in class com.sharethis.textrank.MetricVector
 
list() - Method in class de.l3s.icrawl.crawler.ui.InfoController
 
LocationResolver - Interface in de.l3s.icrawl.snapshots
 
lock - Variable in class de.l3s.icrawl.crawler.frontier.BaseFrontier
 
LoggingStorer - Class in de.l3s.icrawl.crawler.io
 
LoggingStorer() - Constructor for class de.l3s.icrawl.crawler.io.LoggingStorer
 

M

main(String[]) - Static method in class de.l3s.icrawl.crawler.ArchiveCrawler
 
main(String[]) - Static method in class de.l3s.icrawl.crawler.tools.CrawlSpecCreator
 
main(String[]) - Static method in class de.l3s.icrawl.crawler.tools.MergeExternalUrls
 
main(String[]) - Static method in class de.l3s.icrawl.crawler.tools.QueryKeywordsCreator
 
main(String[]) - Static method in class de.l3s.icrawl.crawler.yarn.AppMaster
 
main(String[]) - Static method in class de.l3s.icrawl.crawler.yarn.Client
 
main(String[]) - Static method in class de.l3s.icrawl.crawler.yarn.EvaluationAppMaster
 
main(String[]) - Static method in class de.l3s.icrawl.crawler.yarn.EvaluationClient
 
main(String[]) - Static method in class org.openimaj.text.nlp.language.LanguageDetector
Prints the available languages.
map(String) - Method in class de.l3s.icrawl.contentanalysis.Labeler
 
mapTokens(LanguageModel, Graph) - Method in class com.sharethis.textrank.Sentence
Main processing per sentence.
marked - Variable in class com.sharethis.textrank.Node
 
MarkovChainLanguageModel - Class in org.openimaj.text.nlp.language
Code to train, classify and generate language-specific text by building a first-order Markov chain.
MarkovChainLanguageModel() - Constructor for class org.openimaj.text.nlp.language.MarkovChainLanguageModel
Generate a new empty markov chain language model
MAX_NGRAM_LENGTH - Static variable in class com.sharethis.textrank.TextRank
 
MAX_WORDNET_GRAPH - Static variable in class com.sharethis.textrank.TextRank
 
MAX_WORDNET_TEXT - Static variable in class com.sharethis.textrank.TextRank
 
maxNeighbor(double, double) - Method in class com.sharethis.textrank.Node
Search nearest neighbors in WordNet subgraph to find the maximum rank of any adjacent SYNONYM synset.
maxUrls - Variable in class de.l3s.icrawl.crawler.ArchiveCrawler.ZipFileStorerConfig
 
MediawikiModule - Class in net.sourceforge.jwbf.mapper
 
MediawikiModule() - Constructor for class net.sourceforge.jwbf.mapper.MediawikiModule
 
merge(Collection<DocumentVector>, boolean) - Static method in class de.l3s.icrawl.contentanalysis.DocumentVector
 
merge(CrawlUrl) - Method in class de.l3s.icrawl.crawler.CrawlUrl
Merge with other instance.
MergeExternalUrls - Class in de.l3s.icrawl.crawler.tools
 
MergeExternalUrls() - Constructor for class de.l3s.icrawl.crawler.tools.MergeExternalUrls
 
META_ATTRIBUTE_NAMES - Static variable in class de.l3s.icrawl.util.DateUtils
 
metric - Variable in class com.sharethis.textrank.MetricVector
Public members.
metric_space - Variable in class com.sharethis.textrank.TextRank
 
MetricVector - Class in com.sharethis.textrank
Implements a point in the vector space representing the distance metric.
MetricVector(NodeValue, double, double, double) - Constructor for class com.sharethis.textrank.MetricVector
Constructor.
MIN_NORMALIZED_RANK - Static variable in class com.sharethis.textrank.TextRank
 

N

name() - Method in class io.mola.galimatias.NameValue
 
NamedEntity - Class in de.l3s.icrawl.domain.specification
 
NamedEntity(NamedEntity.Type, String) - Constructor for class de.l3s.icrawl.domain.specification.NamedEntity
 
NamedEntity(NamedEntity.Type, Set<NamedEntity.Label>) - Constructor for class de.l3s.icrawl.domain.specification.NamedEntity
 
NamedEntity(NamedEntity.Type, NamedEntity.Label...) - Constructor for class de.l3s.icrawl.domain.specification.NamedEntity
 
NamedEntity.Label - Class in de.l3s.icrawl.domain.specification
An entity label.
NamedEntity.Type - Enum in de.l3s.icrawl.domain.specification
 
NameValue - Class in io.mola.galimatias
A name-value pair.
NameValue(String, String) - Constructor for class io.mola.galimatias.NameValue
 
net.sourceforge.jwbf.core.contentRep - package net.sourceforge.jwbf.core.contentRep
 
net.sourceforge.jwbf.mapper - package net.sourceforge.jwbf.mapper
 
net.sourceforge.jwbf.mediawiki.actions.misc - package net.sourceforge.jwbf.mediawiki.actions.misc
 
newInstance(Class<T>) - Static method in class org.openimaj.io.IOUtils
Create a new instance of the given class.
next() - Method in class de.l3s.icrawl.crawler.frontier.WeightedRandomSelector
 
NGram - Class in com.sharethis.textrank
Implements a wrapper for tallying an n-gram in the text, composed of selected keywords.
ngram_subgraph - Variable in class com.sharethis.textrank.TextRank
 
NLP_RESOURCES - Static variable in class com.sharethis.textrank.TextRank
Public definitions.
Node - Class in com.sharethis.textrank
Implements a node in the TextRank graph, denoting some noun or adjective morpheme.
node_list - Variable in class com.sharethis.textrank.Graph
Protected members.
node_list - Variable in class com.sharethis.textrank.Sentence
 
nodes - Variable in class com.sharethis.textrank.NGram
Public members.
NodeValue - Class in com.sharethis.textrank
Implements a node value in a TextRank graph.
NodeValue() - Constructor for class com.sharethis.textrank.NodeValue
 
normalize(String) - Method in class de.l3s.icrawl.crawler.urls.RegexUrlNormalizer
 
normalize(String) - Method in class de.l3s.icrawl.crawler.urls.UrlCanonicalizerNormalizer
 
normalize(String) - Method in interface de.l3s.icrawl.crawler.urls.UrlNormalizer
 
normalize(String) - Method in class de.l3s.icrawl.crawler.urls.UrlNormalizers
 
NUM_URLS - Static variable in class de.l3s.icrawl.crawler.Crawler
 
NumberOfUrlsStoppingCriterion - Class in de.l3s.icrawl.crawler.scheduling
 
NumberOfUrlsStoppingCriterion(long) - Constructor for class de.l3s.icrawl.crawler.scheduling.NumberOfUrlsStoppingCriterion
 

O

onApplicationEvent(EmbeddedServletContainerInitializedEvent) - Method in class de.l3s.icrawl.crawler.ArchiveCrawler
 
ONLY_HTTP - Static variable in interface de.l3s.icrawl.crawler.urls.UrlFilter
 
OnlyHtmlCharsetDetector - Class in de.l3s.icrawl.snapshots
Charset detector for HTML files.
OnlyHtmlCharsetDetector() - Constructor for class de.l3s.icrawl.snapshots.OnlyHtmlCharsetDetector
 
open(SnaphotLocation) - Method in class de.l3s.icrawl.snapshots.HdfsSnapshotReader
 
open(SnaphotLocation) - Method in interface de.l3s.icrawl.snapshots.SnapshotReader
Open a reader at the given location.
org.openimaj.io - package org.openimaj.io
 
org.openimaj.io.wrappers - package org.openimaj.io.wrappers
 
org.openimaj.text.nlp.language - package org.openimaj.text.nlp.language
 
outgoing - Variable in class de.l3s.icrawl.crawler.frontier.BaseFrontier
 
outlink(String, float, ZonedDateTime) - Method in class de.l3s.icrawl.crawler.CrawlUrl
 
OUTPUT_DIRECTORY - Static variable in interface de.l3s.icrawl.crawler.io.ResultStorer
 
outputDirectory - Variable in class de.l3s.icrawl.crawler.ArchiveCrawler.CsvStorerConfig
 
outputDirectory - Variable in class de.l3s.icrawl.crawler.ArchiveCrawler.ZipFileStorerConfig
 

P

parse(String) - Static method in class io.mola.galimatias.FormURLEncodedParser
Charset defaults to UTF-8.
parse(String, Charset) - Static method in class io.mola.galimatias.FormURLEncodedParser
 
ParsedPage - Class in net.sourceforge.jwbf.core.contentRep
 
ParsedPage() - Constructor for class net.sourceforge.jwbf.core.contentRep.ParsedPage
 
ParsedPage.Category - Class in net.sourceforge.jwbf.core.contentRep
 
ParsedPage.InterWikiLink - Class in net.sourceforge.jwbf.core.contentRep
 
ParsedPage.LangLink - Class in net.sourceforge.jwbf.core.contentRep
 
ParsedPage.Link - Class in net.sourceforge.jwbf.core.contentRep
 
ParsedPage.Redirect - Class in net.sourceforge.jwbf.core.contentRep
 
ParsedPage.Section - Class in net.sourceforge.jwbf.core.contentRep
 
parseHtml(InputStream, String) - Static method in class de.l3s.icrawl.util.WebPageUtils
 
parseHtml(String, String) - Static method in class de.l3s.icrawl.util.WebPageUtils
 
ParsePage - Class in net.sourceforge.jwbf.mediawiki.actions.misc
 
ParsePage(String, Set<ParsePage.ParseProp>, boolean, Integer, String, MediaWiki.Version) - Constructor for class net.sourceforge.jwbf.mediawiki.actions.misc.ParsePage
 
ParsePage(String, Set<ParsePage.ParseProp>, boolean, MediaWiki.Version) - Constructor for class net.sourceforge.jwbf.mediawiki.actions.misc.ParsePage
 
ParsePage.ParseProp - Enum in net.sourceforge.jwbf.mediawiki.actions.misc
 
parseSentence(String) - Method in class com.sharethis.textrank.CoreNlpLanguageModel
 
parseSentence(String) - Method in class com.sharethis.textrank.LanguageModel
Tokenize and tag the sentence text.
parseTimestamp(String) - Static method in class de.l3s.icrawl.snapshots.Utils
 
pop() - Method in class de.l3s.icrawl.crawler.frontier.BaseFrontier
 
pop() - Method in interface de.l3s.icrawl.crawler.frontier.Frontier
 
popInternal() - Method in class de.l3s.icrawl.crawler.frontier.BaseFrontier
 
popInternal() - Method in class de.l3s.icrawl.crawler.frontier.FileBasedFrontier
 
popInternal() - Method in class de.l3s.icrawl.crawler.frontier.InMemoryFrontier
 
pos - Variable in class com.sharethis.textrank.KeyWord
Public members.
postProcessAfterInitialization(Object, String) - Method in class de.l3s.icrawl.crawler.ui.UiConfig.RequestMappingHandlerMappingPostProcessor
 
postProcessBeforeInitialization(Object, String) - Method in class de.l3s.icrawl.crawler.ui.UiConfig.RequestMappingHandlerMappingPostProcessor
 
prepare() - Method in class de.l3s.icrawl.crawler.yarn.BaseClient
 
prepare() - Method in class de.l3s.icrawl.crawler.yarn.Client
 
prepare() - Method in class de.l3s.icrawl.crawler.yarn.EvaluationClient
 
prepCall(String, boolean) - Method in class com.sharethis.textrank.TextRank
Prepare to call algorithm with a new text to analyze.
processReturningText(String, HttpAction) - Method in class net.sourceforge.jwbf.mediawiki.actions.misc.ParsePage
 
PROFILE_EVALUATION - Static variable in class de.l3s.icrawl.crawler.ArchiveCrawler
 
PROFILE_EXTRACT - Static variable in class de.l3s.icrawl.crawler.ArchiveCrawler
 
progress - Variable in class de.l3s.icrawl.crawler.yarn.BaseAppMaster
 
push(Collection<CrawlUrl>) - Method in class de.l3s.icrawl.crawler.frontier.BaseFrontier
 
push(Collection<CrawlUrl>) - Method in interface de.l3s.icrawl.crawler.frontier.Frontier
 
pushInternal(CrawlUrl) - Method in class de.l3s.icrawl.crawler.frontier.BaseFrontier
 
pushInternal(CrawlUrl) - Method in class de.l3s.icrawl.crawler.frontier.FileBasedFrontier
 
pushInternal(CrawlUrl) - Method in class de.l3s.icrawl.crawler.frontier.InMemoryFrontier
 

Q

QueryKeywordsCreator - Class in de.l3s.icrawl.crawler.tools
 
QueryKeywordsCreator() - Constructor for class de.l3s.icrawl.crawler.tools.QueryKeywordsCreator
 
QueueEmptyCriterion - Class in de.l3s.icrawl.crawler.scheduling
 
QueueEmptyCriterion(long, TimeUnit) - Constructor for class de.l3s.icrawl.crawler.scheduling.QueueEmptyCriterion
 

R

rank - Variable in class com.sharethis.textrank.Node
 
rank(String, Locale, int) - Method in class de.l3s.icrawl.contentanalysis.TextRankWrapper
Get the top k keywords of a text by using the TextRank algorithm.
read() - Method in class de.l3s.icrawl.util.ByteBufferBackedInputStream
 
read(byte[], int, int) - Method in class de.l3s.icrawl.util.ByteBufferBackedInputStream
 
read(InputStream, T) - Static method in class org.openimaj.io.IOUtils
Read an instance of an object from an input stream.
Readable2DArrayBinary - Class in org.openimaj.io.wrappers
A wrapper for a 2D double array that is readable.
Readable2DArrayBinary(double[][]) - Constructor for class org.openimaj.io.wrappers.Readable2DArrayBinary
Construct with a backing matrix
ReadableArrayBinary<V> - Class in org.openimaj.io.wrappers
A wrapper for an array that is readable.
ReadableArrayBinary(V[]) - Constructor for class org.openimaj.io.wrappers.ReadableArrayBinary
Construct with a backing list
ReadableBinary - Interface in org.openimaj.io
Interface for objects capable of deserialising themselves from binary formats.
readBinary(DataInput) - Method in interface org.openimaj.io.ReadableBinary
Read internal state from in.
readBinary(DataInput) - Method in class org.openimaj.io.wrappers.Readable2DArrayBinary
 
readBinary(DataInput) - Method in class org.openimaj.io.wrappers.ReadableArrayBinary
 
readBinary(DataInput) - Method in class org.openimaj.text.nlp.language.LanguageModel
 
readFile(File) - Static method in class de.l3s.icrawl.crawler.ArchiveCrawlSpecification
 
readIdfDictionary(InputStream) - Static method in class de.l3s.icrawl.contentanalysis.LanguageModels
 
readLanguageModel(Locale, InputStream) - Static method in class de.l3s.icrawl.contentanalysis.LanguageModels
 
readSnapshot(ArchiveRecord) - Method in class de.l3s.icrawl.snapshots.ArchiveRecordParser
 
readValue(DataInput) - Method in class org.openimaj.io.wrappers.ReadableArrayBinary
 
ReadWriteableBinary - Interface in org.openimaj.io
Interface for objects capable of serialising and deserialising themselves to and from binary format.
Redirect() - Constructor for class net.sourceforge.jwbf.core.contentRep.ParsedPage.Redirect
 
RegexUrlNormalizer - Class in de.l3s.icrawl.crawler.urls
 
RegexUrlNormalizer(URL) - Constructor for class de.l3s.icrawl.crawler.urls.RegexUrlNormalizer
 
RELEVANCE_THRESHOLD - Static variable in class de.l3s.icrawl.crawler.Crawler
 
removeListener(StoppingCriterion.StopListener) - Method in class de.l3s.icrawl.crawler.scheduling.StoppingCriterion
 
render() - Method in class com.sharethis.textrank.MetricVector
Serialize as text.
renderContexts() - Method in class com.sharethis.textrank.NGram
Short-cut replacement for a toString() method.
RequestMappingHandlerMappingPostProcessor() - Constructor for class de.l3s.icrawl.crawler.ui.UiConfig.RequestMappingHandlerMappingPostProcessor
 
resolve(SnaphotLocation) - Method in class de.l3s.icrawl.snapshots.DirectoryPrefixResolver
 
resolve(SnaphotLocation) - Method in interface de.l3s.icrawl.snapshots.LocationResolver
 
Resource - Class in de.l3s.icrawl.crawler
 
Resource(CrawlUrl, Map<String, String>, String) - Constructor for class de.l3s.icrawl.crawler.Resource
 
ResourceAnalyser - Class in de.l3s.icrawl.crawler.analysis
 
ResourceAnalyser(ArchiveCrawlSpecification, ResourceAnalyser.WeightingMethod, MetricRegistry, float, float) - Constructor for class de.l3s.icrawl.crawler.analysis.ResourceAnalyser
 
ResourceAnalyser.Factory - Class in de.l3s.icrawl.crawler.analysis
 
ResourceAnalyser.Result - Class in de.l3s.icrawl.crawler.analysis
 
ResourceAnalyser.WeightingMethod - Enum in de.l3s.icrawl.crawler.analysis
 
ResourceAnalyserFactory - Interface in de.l3s.icrawl.crawler.analysis
 
ResourceNotFoundException(String) - Constructor for exception de.l3s.icrawl.crawler.ui.UiConfig.ResourceNotFoundException
 
ResultStorer - Interface in de.l3s.icrawl.crawler.io
 
ResultStorer.Factory - Interface in de.l3s.icrawl.crawler.io
 
run() - Method in class de.l3s.icrawl.crawler.CrawlerThread
 
run(String[]) - Method in class de.l3s.icrawl.crawler.yarn.BaseAppMaster
 
run(String[]) - Method in class de.l3s.icrawl.crawler.yarn.BaseClient
 
runTextRank() - Method in class com.sharethis.textrank.Graph
Run through N iterations of the TextRank algorithm, or until the standard error converges below a given threshold.

S

s - Variable in class com.sharethis.textrank.Context
Public members.
scrubToken(String) - Method in class com.sharethis.textrank.LanguageModel
Clean the text for a token.
Section() - Constructor for class net.sourceforge.jwbf.core.contentRep.ParsedPage.Section
 
seenUrls - Variable in class de.l3s.icrawl.crawler.frontier.BaseFrontier
 
Sentence - Class in com.sharethis.textrank
 
Sentence(String, String[], String[]) - Constructor for class com.sharethis.textrank.Sentence
Constructor.
serializeGraph(Set<String>) - Method in class com.sharethis.textrank.Node
Traverse the graph, serializing out the nodes and edges.
setLanguageModels(LanguageModels) - Method in class de.l3s.icrawl.contentanalysis.DocumentVectorSimilarity
 
setPageId(String) - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage
 
setRedirects(List<ParsedPage.Redirect>) - Method in class net.sourceforge.jwbf.core.contentRep.ParsedPage
 
setupModule(Module.SetupContext) - Method in class net.sourceforge.jwbf.mapper.MediawikiModule
 
show(String) - Method in class de.l3s.icrawl.crawler.ui.InfoController
 
shutdown() - Method in class de.l3s.icrawl.crawler.Crawler
 
SnaphotLocation - Class in de.l3s.icrawl.snapshots
 
SnaphotLocation(String, ZonedDateTime, String, long, long, String, String) - Constructor for class de.l3s.icrawl.snapshots.SnaphotLocation
 
Snapshot - Class in de.l3s.icrawl.snapshots
 
Snapshot(String, ZonedDateTime, int, String, Map<String, String>, Object) - Constructor for class de.l3s.icrawl.snapshots.Snapshot
 
SnapshotReader - Interface in de.l3s.icrawl.snapshots
 
SNAPSHOTS_TO_ANALYZE - Static variable in class de.l3s.icrawl.crawler.Crawler
 
SnapshotsLocator - Interface in de.l3s.icrawl.snapshots
 
sortResults(long) - Method in class com.sharethis.textrank.Graph
Sort results to identify potential keywords.
splitParagraph(String) - Method in class com.sharethis.textrank.CoreNlpLanguageModel
 
splitParagraph(String) - Method in class com.sharethis.textrank.LanguageModel
Split sentences within the paragraph text.
STANDARD_ERROR_THRESHOLD - Static variable in class com.sharethis.textrank.Graph
 
start - Variable in class com.sharethis.textrank.Context
 
start_time - Variable in class com.sharethis.textrank.TextRank
 
status() - Method in class de.l3s.icrawl.crawler.ui.InfoController
 
stemToken(String) - Method in class com.sharethis.textrank.CoreNlpLanguageModel
 
stemToken(String) - Method in class com.sharethis.textrank.LanguageModel
Perform stemming on the given token.
stop(boolean) - Method in class de.l3s.icrawl.crawler.Crawler
 
stop() - Method in class de.l3s.icrawl.crawler.CrawlerThread
 
stop() - Method in class de.l3s.icrawl.crawler.scheduling.StoppingCriterion
 
stop() - Method in interface de.l3s.icrawl.crawler.scheduling.StoppingCriterion.StopListener
 
stop() - Method in class de.l3s.icrawl.crawler.ui.InfoController
 
StoppingCriterion - Class in de.l3s.icrawl.crawler.scheduling
 
StoppingCriterion() - Constructor for class de.l3s.icrawl.crawler.scheduling.StoppingCriterion
 
StoppingCriterion.StopListener - Interface in de.l3s.icrawl.crawler.scheduling
 
store(CrawledResource) - Method in class de.l3s.icrawl.crawler.io.CsvStorer
 
store(CrawledResource) - Method in class de.l3s.icrawl.crawler.io.LoggingStorer
 
store(CrawledResource) - Method in interface de.l3s.icrawl.crawler.io.ResultStorer
 
store(CrawledResource) - Method in class de.l3s.icrawl.crawler.io.ZipFileStorer
 
storeNotFound(CrawlUrl) - Method in class de.l3s.icrawl.crawler.io.CsvStorer
 
storeNotFound(CrawlUrl) - Method in class de.l3s.icrawl.crawler.io.LoggingStorer
 
storeNotFound(CrawlUrl) - Method in interface de.l3s.icrawl.crawler.io.ResultStorer
 
storeNotFound(CrawlUrl) - Method in class de.l3s.icrawl.crawler.io.ZipFileStorer
 
storerFactory(Configuration) - Method in class de.l3s.icrawl.crawler.ArchiveCrawler.CsvStorerConfig
 
storerFactory(Configuration) - Method in interface de.l3s.icrawl.crawler.ArchiveCrawler.StorerConfig
 
storerFactory(Configuration) - Method in class de.l3s.icrawl.crawler.ArchiveCrawler.ZipFileStorerConfig
 
StripParametersCanonicalizer(Pattern) - Constructor for class de.l3s.icrawl.crawler.urls.UrlCanonicalizerNormalizer.StripParametersCanonicalizer
 
synset_rank - Variable in class com.sharethis.textrank.MetricVector
 

T

text - Variable in class com.sharethis.textrank.NodeValue
Public members.
text - Variable in class com.sharethis.textrank.Sentence
Public members.
text - Variable in class com.sharethis.textrank.TextRank
 
TextExtractor - Class in de.l3s.icrawl.util
 
TextRank - Class in com.sharethis.textrank
Java implementation of the TextRank algorithm by Rada Mihalcea, et al.
TextRank(String, String) - Constructor for class com.sharethis.textrank.TextRank
Constructor.
TEXTRANK_DAMPING_FACTOR - Static variable in class com.sharethis.textrank.Graph
 
TextRankWrapper - Class in de.l3s.icrawl.contentanalysis
Class wrapping an implementation of the TextRank algorithm for extracting keywords of a text.
TextRankWrapper() - Constructor for class de.l3s.icrawl.contentanalysis.TextRankWrapper
 
TextRankWrapper.LANG_CODE - Enum in de.l3s.icrawl.contentanalysis
 
TimeSpecification - Class in de.l3s.icrawl.crawler
 
to - Variable in class net.sourceforge.jwbf.core.contentRep.ParsedPage.Redirect
 
tofragment - Variable in class net.sourceforge.jwbf.core.contentRep.ParsedPage.Redirect
 
TOKEN_LENGTH_LIMIT - Static variable in class com.sharethis.textrank.LanguageModel
Public definitions.
token_list - Variable in class com.sharethis.textrank.Sentence
 
topComponents(int) - Method in class de.l3s.icrawl.contentanalysis.DocumentVector
 
topK(Multiset<T>, int) - Static method in class de.l3s.icrawl.contentanalysis.ContentAnalyser.Counts
 
topN(int) - Method in class de.l3s.icrawl.contentanalysis.DocumentVector
 
toString() - Method in class com.sharethis.textrank.TextRank
Serialize resulting graph to a string.
toString() - Method in class de.l3s.icrawl.contentanalysis.DocumentVector
 
toString() - Method in class de.l3s.icrawl.contentanalysis.DocumentVectorSimilarity
 
toString() - Method in class de.l3s.icrawl.contentanalysis.WebPageDateExtractor.WebPageDate
 
toString() - Method in class de.l3s.icrawl.crawler.CrawledResource
 
toString() - Method in class de.l3s.icrawl.crawler.CrawlUrl
 
toString() - Method in class de.l3s.icrawl.crawler.TimeSpecification
 
toString() - Method in class de.l3s.icrawl.domain.specification.NamedEntity.Label
 
toString() - Method in class de.l3s.icrawl.domain.specification.NamedEntity
 
toString() - Method in class de.l3s.icrawl.snapshots.SnaphotLocation
 
toString() - Method in class de.l3s.icrawl.snapshots.Snapshot
 
toString(ZonedDateTime) - Static method in class de.l3s.icrawl.snapshots.Utils
 
toString() - Method in class io.mola.galimatias.NameValue
 
toString() - Method in class org.openimaj.text.nlp.language.LanguageDetector.WeightedLocale
 
totalIncoming - Variable in class de.l3s.icrawl.crawler.frontier.BaseFrontier
 
train(Locale, String, String) - Method in class org.openimaj.text.nlp.language.MarkovChainLanguageModel
Add an example to a language's markov chain
train(Locale, InputStream) - Method in class org.openimaj.text.nlp.language.MarkovChainLanguageModel
Train a given language on a stream of text

U

UiConfig - Class in de.l3s.icrawl.crawler.ui
 
UiConfig() - Constructor for class de.l3s.icrawl.crawler.ui.UiConfig
 
UiConfig.RequestMappingHandlerMappingPostProcessor - Class in de.l3s.icrawl.crawler.ui
 
UiConfig.ResourceNotFoundException - Exception in de.l3s.icrawl.crawler.ui
 
updateEmptyQueue() - Method in class de.l3s.icrawl.crawler.scheduling.CompositeStoppingCriterion
 
updateEmptyQueue() - Method in class de.l3s.icrawl.crawler.scheduling.QueueEmptyCriterion
 
updateEmptyQueue() - Method in class de.l3s.icrawl.crawler.scheduling.StoppingCriterion
 
updateFailure() - Method in class de.l3s.icrawl.crawler.scheduling.CompositeStoppingCriterion
 
updateFailure() - Method in class de.l3s.icrawl.crawler.scheduling.QueueEmptyCriterion
 
updateFailure() - Method in class de.l3s.icrawl.crawler.scheduling.StoppingCriterion
 
updateIrrelevant(double) - Method in class de.l3s.icrawl.crawler.scheduling.CompositeStoppingCriterion
 
updateIrrelevant(double) - Method in class de.l3s.icrawl.crawler.scheduling.QueueEmptyCriterion
 
updateIrrelevant(double) - Method in class de.l3s.icrawl.crawler.scheduling.StoppingCriterion
 
updateSuccess(double) - Method in class de.l3s.icrawl.crawler.scheduling.CompositeStoppingCriterion
 
updateSuccess(double) - Method in class de.l3s.icrawl.crawler.scheduling.NumberOfUrlsStoppingCriterion
 
updateSuccess(double) - Method in class de.l3s.icrawl.crawler.scheduling.QueueEmptyCriterion
 
updateSuccess(double) - Method in class de.l3s.icrawl.crawler.scheduling.StoppingCriterion
 
uploadTempFile(Path, Configuration, String, String) - Static method in class de.l3s.icrawl.crawler.yarn.BaseClient
 
UrlCanonicalizerNormalizer - Class in de.l3s.icrawl.crawler.urls
 
UrlCanonicalizerNormalizer() - Constructor for class de.l3s.icrawl.crawler.urls.UrlCanonicalizerNormalizer
 
UrlCanonicalizerNormalizer.StripParametersCanonicalizer - Class in de.l3s.icrawl.crawler.urls
 
UrlFilter - Interface in de.l3s.icrawl.crawler.urls
 
UrlNormalizer - Interface in de.l3s.icrawl.crawler.urls
 
UrlNormalizers - Class in de.l3s.icrawl.crawler.urls
 
UrlNormalizers(UrlNormalizer...) - Constructor for class de.l3s.icrawl.crawler.urls.UrlNormalizers
 
UrlNormalizers(List<UrlNormalizer>) - Constructor for class de.l3s.icrawl.crawler.urls.UrlNormalizers
 
URLSearchParameters - Class in io.mola.galimatias
 
URLSearchParameters(String) - Constructor for class io.mola.galimatias.URLSearchParameters
 
use_wordnet - Variable in class com.sharethis.textrank.TextRank
 
Utils - Class in de.l3s.icrawl.snapshots
 

V

value - Variable in class com.sharethis.textrank.MetricVector
 
value - Variable in class com.sharethis.textrank.Node
 
value() - Method in class io.mola.galimatias.NameValue
 
value - Variable in class org.openimaj.io.wrappers.Readable2DArrayBinary
The underlying Matrix
value - Variable in class org.openimaj.io.wrappers.ReadableArrayBinary
The underlying list
value - Variable in class org.openimaj.io.wrappers.Writeable2DArrayBinary
The underlying array
value - Variable in class org.openimaj.io.wrappers.WriteableArrayBinary
The underlying array
valueOf(String) - Static method in enum de.l3s.icrawl.contentanalysis.TextRankWrapper.LANG_CODE
Returns the enum constant of this type with the specified name.
valueOf(String) - Static method in enum de.l3s.icrawl.contentanalysis.WebPageDateExtractor.DateSource
Returns the enum constant of this type with the specified name.
valueOf(String) - Static method in enum de.l3s.icrawl.crawler.analysis.ResourceAnalyser.WeightingMethod
Returns the enum constant of this type with the specified name.
valueOf(String) - Static method in enum de.l3s.icrawl.crawler.CrawlUrl.Path
Returns the enum constant of this type with the specified name.
valueOf(String) - Static method in enum de.l3s.icrawl.domain.specification.NamedEntity.Type
Returns the enum constant of this type with the specified name.
valueOf(String) - Static method in enum net.sourceforge.jwbf.mediawiki.actions.misc.ParsePage.ParseProp
Returns the enum constant of this type with the specified name.
values() - Static method in enum de.l3s.icrawl.contentanalysis.TextRankWrapper.LANG_CODE
Returns an array containing the constants of this enum type, in the order they are declared.
values() - Static method in enum de.l3s.icrawl.contentanalysis.WebPageDateExtractor.DateSource
Returns an array containing the constants of this enum type, in the order they are declared.
values() - Static method in enum de.l3s.icrawl.crawler.analysis.ResourceAnalyser.WeightingMethod
Returns an array containing the constants of this enum type, in the order they are declared.
values() - Static method in enum de.l3s.icrawl.crawler.CrawlUrl.Path
Returns an array containing the constants of this enum type, in the order they are declared.
values() - Static method in enum de.l3s.icrawl.domain.specification.NamedEntity.Type
Returns an array containing the constants of this enum type, in the order they are declared.
values() - Static method in enum net.sourceforge.jwbf.mediawiki.actions.misc.ParsePage.ParseProp
Returns an array containing the constants of this enum type, in the order they are declared.

W

WebPageDate(ZonedDateTime, WebPageDateExtractor.DateSource) - Constructor for class de.l3s.icrawl.contentanalysis.WebPageDateExtractor.WebPageDate
 
WebPageDateExtractor - Class in de.l3s.icrawl.contentanalysis
 
WebPageDateExtractor() - Constructor for class de.l3s.icrawl.contentanalysis.WebPageDateExtractor
 
WebPageDateExtractor.DateSource - Enum in de.l3s.icrawl.contentanalysis
 
WebPageDateExtractor.ExtractionException - Exception in de.l3s.icrawl.contentanalysis
 
WebPageDateExtractor.WebPageDate - Class in de.l3s.icrawl.contentanalysis
 
WebPageUtils - Class in de.l3s.icrawl.util
 
WeightedLocale(String, double) - Constructor for class org.openimaj.text.nlp.language.LanguageDetector.WeightedLocale
Default constructor
WeightedRandomSelector - Class in de.l3s.icrawl.crawler.frontier
Pick a number in [0, n) such that higher numbers are picked more frequently.
WeightedRandomSelector(int, int) - Constructor for class de.l3s.icrawl.crawler.frontier.WeightedRandomSelector
 
WEIGHTING_METHOD - Static variable in class de.l3s.icrawl.crawler.Crawler
 
with(String, String) - Method in class io.mola.galimatias.URLSearchParameters
 
with(NameValue) - Method in class io.mola.galimatias.URLSearchParameters
 
withAppended(String, String) - Method in class io.mola.galimatias.URLSearchParameters
 
withAppended(NameValue) - Method in class io.mola.galimatias.URLSearchParameters
 
without(String) - Method in class io.mola.galimatias.URLSearchParameters
 
withSeedUrls(List<String>) - Method in class de.l3s.icrawl.crawler.ArchiveCrawlSpecification
 
withWarcFile(String) - Method in class de.l3s.icrawl.snapshots.SnaphotLocation
 
Writeable2DArrayBinary - Class in org.openimaj.io.wrappers
A wrapper for an array that is writeable.
Writeable2DArrayBinary(double[][]) - Constructor for class org.openimaj.io.wrappers.Writeable2DArrayBinary
Construct with the given array.
WriteableArrayBinary<V> - Class in org.openimaj.io.wrappers
A wrapper for an array that is writeable.
WriteableArrayBinary(V[]) - Constructor for class org.openimaj.io.wrappers.WriteableArrayBinary
Construct with the given array.
WriteableBinary - Interface in org.openimaj.io
Interface for objects capable of serialising themselves to binary format.
writeBinary(DataOutput) - Method in class org.openimaj.io.wrappers.Writeable2DArrayBinary
 
writeBinary(DataOutput) - Method in class org.openimaj.io.wrappers.WriteableArrayBinary
 
writeBinary(DataOutput) - Method in interface org.openimaj.io.WriteableBinary
Write the content of this as binary to out.
writeBinary(DataOutput) - Method in class org.openimaj.text.nlp.language.LanguageModel
 
writeFile(File) - Method in class de.l3s.icrawl.crawler.ArchiveCrawlSpecification
 
writeValue(V, DataOutput) - Method in class org.openimaj.io.wrappers.WriteableArrayBinary
 

Z

ZipFileStorer - Class in de.l3s.icrawl.crawler.io
 
ZipFileStorer(OutputStream, int) - Constructor for class de.l3s.icrawl.crawler.io.ZipFileStorer
 
ZipFileStorerConfig() - Constructor for class de.l3s.icrawl.crawler.ArchiveCrawler.ZipFileStorerConfig
 
A B C D E F G H I K L M N O P Q R S T U V W Z 
Skip navigation links

Copyright © 2017. All rights reserved.