protected static class RobotsManager.RobotsData
extends java.lang.Object
| Modifier and Type | Field and Description |
|---|---|
| protected long | expiration |
| protected java.util.ArrayList | records |
| Constructor and Description |
|---|
| RobotsData(java.io.InputStream is, long expiration, java.lang.String hostName, org.apache.manifoldcf.crawler.interfaces.IProcessActivity activities) — Constructor. |
| Modifier and Type | Method and Description |
|---|---|
| long | getExpirationTime() — Get expiration |
| boolean | isFetchAllowed(java.lang.String userAgent, java.lang.String pathString) — Check if fetch is allowed |
| protected void | parseRobotsTxt(java.io.BufferedReader r, java.lang.String hostName, org.apache.manifoldcf.crawler.interfaces.IProcessActivity activities) — Parse the robots.txt file using a reader. |
public RobotsData(java.io.InputStream is,
long expiration,
java.lang.String hostName,
org.apache.manifoldcf.crawler.interfaces.IProcessActivity activities)
throws java.io.IOException,
org.apache.manifoldcf.core.interfaces.ManifoldCFException
Throws:
java.io.IOException
org.apache.manifoldcf.core.interfaces.ManifoldCFException

public boolean isFetchAllowed(java.lang.String userAgent,
java.lang.String pathString)
public long getExpirationTime()
protected void parseRobotsTxt(java.io.BufferedReader r,
java.lang.String hostName,
org.apache.manifoldcf.crawler.interfaces.IProcessActivity activities)
throws java.io.IOException,
org.apache.manifoldcf.core.interfaces.ManifoldCFException
Throws:
java.io.IOException
org.apache.manifoldcf.core.interfaces.ManifoldCFException