protected static class RSSConnector.Filter extends Object
Modifier and Type | Field and Description |
---|---|
protected HashMap | acls |
protected Integer | badFeedRescanInterval |
protected RSSConnector.CanonicalizationPolicies | canonicalizationPolicies |
protected int | chromedContentMode |
protected int | dechromedContentMode |
protected Integer | defaultRescanInterval |
protected ArrayList | excludePatterns — The ArrayList of exclude patterns. |
protected int | feedTimeoutValue |
protected ArrayList | includePatterns — The ArrayList of include patterns. |
protected RSSConnector.MappingRules | mappings |
protected ArrayList | metadata |
protected Integer | minimumRescanInterval |
protected HashMap | seeds |
Constructor and Description |
---|
RSSConnector.Filter(Specification spec, boolean warnOnBadSeed) — Constructor. |
Modifier and Type | Method and Description |
---|---|
String[] | getAcls() — Get the ACLs. |
Long | getBadFeedRescanTime(long currentTime) — Get the next time a "bad feed" should be rescanned. |
RSSConnector.CanonicalizationPolicies | getCanonicalizationPolicies() — Get the canonicalization policies. |
int | getChromedContentMode() — Get the chromed content mode. |
int | getDechromedContentMode() — Get the dechromed content mode. |
Long | getDefaultRescanTime(long currentTime) — Get the next time (by default) a feed should be scanned. |
int | getFeedTimeoutValue() — Get the feed timeout value. |
ArrayList | getMetadata() — Get the specified metadata. |
Long | getMinimumRescanTime(long currentTime) — Get the minimum next time a feed should be scanned. |
Iterator | getSeeds() — Iterate over all canonicalized seeds. |
boolean | isLegalURL(String url) — Check for legality of a URL. |
boolean | isSeed(String canonicalUrl) — Check if a document is a seed. |
String | mapDocumentURL(String url) — Scan patterns and return the one that matches first. |
protected RSSConnector.MappingRules mappings
protected HashMap seeds
protected Integer defaultRescanInterval
protected Integer minimumRescanInterval
protected Integer badFeedRescanInterval
protected int dechromedContentMode
protected int chromedContentMode
protected int feedTimeoutValue
protected ArrayList metadata
protected HashMap acls
protected RSSConnector.CanonicalizationPolicies canonicalizationPolicies
protected ArrayList includePatterns
protected ArrayList excludePatterns
public RSSConnector.Filter(Specification spec, boolean warnOnBadSeed) throws ManifoldCFException
Throws: ManifoldCFException
public boolean isSeed(String canonicalUrl)
public Iterator getSeeds()
public ArrayList getMetadata()
public String[] getAcls()
public int getFeedTimeoutValue()
public int getDechromedContentMode()
public int getChromedContentMode()
public Long getDefaultRescanTime(long currentTime)
public Long getMinimumRescanTime(long currentTime)
public Long getBadFeedRescanTime(long currentTime)
public boolean isLegalURL(String url)
public String mapDocumentURL(String url) throws ManifoldCFException
Throws: ManifoldCFException
public RSSConnector.CanonicalizationPolicies getCanonicalizationPolicies()