public class ContentLimiter
extends org.apache.manifoldcf.agents.transformation.BaseTransformationConnector
| Modifier and Type | Class and Description |
|---|---|
protected static interface |
ContentLimiter.DestinationStorage |
protected static class |
ContentLimiter.FileDestinationStorage |
protected static class |
ContentLimiter.MemoryDestinationStorage |
protected static class |
ContentLimiter.SpecPacker |
| Modifier and Type | Field and Description |
|---|---|
protected static java.lang.String[] |
activitiesList |
protected static java.lang.String |
ACTIVITY_LIMIT |
protected static long |
inMemoryMaximumFile
We handle up to 64K in memory; after that we go to disk.
|
_rcsid
| Constructor and Description |
|---|
ContentLimiter()
Constructor.
|
| Modifier and Type | Method and Description |
|---|---|
int |
addOrReplaceDocumentWithException(java.lang.String documentURI,
org.apache.manifoldcf.core.interfaces.VersionContext outputDescription,
org.apache.manifoldcf.agents.interfaces.RepositoryDocument document,
java.lang.String authorityNameString,
org.apache.manifoldcf.agents.interfaces.IOutputAddActivity activities)
Add (or replace) a document in the output data store using the connector.
|
boolean |
checkLengthIndexable(org.apache.manifoldcf.core.interfaces.VersionContext outputDescription,
long length,
org.apache.manifoldcf.agents.interfaces.IOutputCheckActivity activities) |
boolean |
checkMimeTypeIndexable(org.apache.manifoldcf.core.interfaces.VersionContext outputDescription,
java.lang.String mimeType,
org.apache.manifoldcf.agents.interfaces.IOutputCheckActivity activities)
Detect if a mime type is indexable or not.
|
protected static void |
fillInContentSpecificationMap(java.util.Map<java.lang.String,java.lang.Object> paramMap,
org.apache.manifoldcf.core.interfaces.Specification os) |
protected static java.util.Set<java.lang.String> |
fillSet(java.lang.String input) |
java.lang.String[] |
getActivitiesList()
Return a list of activities that this connector generates.
|
java.lang.String |
getFormCheckJavascriptMethodName(int connectionSequenceNumber)
Obtain the name of the form check javascript method to call.
|
java.lang.String |
getFormPresaveCheckJavascriptMethodName(int connectionSequenceNumber)
Obtain the name of the form presave check javascript method to call.
|
org.apache.manifoldcf.core.interfaces.VersionContext |
getPipelineDescription(org.apache.manifoldcf.core.interfaces.Specification os)
Get an output version string, given an output specification.
|
protected static int |
handleIOException(java.io.IOException e) |
void |
outputSpecificationBody(org.apache.manifoldcf.core.interfaces.IHTTPOutput out,
java.util.Locale locale,
org.apache.manifoldcf.core.interfaces.Specification os,
int connectionSequenceNumber,
int actualSequenceNumber,
java.lang.String tabName)
Output the specification body section.
|
void |
outputSpecificationHeader(org.apache.manifoldcf.core.interfaces.IHTTPOutput out,
java.util.Locale locale,
org.apache.manifoldcf.core.interfaces.Specification os,
int connectionSequenceNumber,
java.util.List<java.lang.String> tabsArray)
Output the specification header section.
|
java.lang.String |
processSpecificationPost(org.apache.manifoldcf.core.interfaces.IPostParameters variableContext,
java.util.Locale locale,
org.apache.manifoldcf.core.interfaces.Specification os,
int connectionSequenceNumber)
Process a specification post.
|
void |
viewSpecification(org.apache.manifoldcf.core.interfaces.IHTTPOutput out,
java.util.Locale locale,
org.apache.manifoldcf.core.interfaces.Specification os,
int connectionSequenceNumber)
View specification.
|
checkDateIndexable, checkDocumentIndexable, checkURLIndexable, requestInfo
check, clearThreadContext, connect, deinstall, disconnect, getConfiguration, install, isConnected, outputConfigurationBody, outputConfigurationBody, outputConfigurationHeader, outputConfigurationHeader, outputConfigurationHeader, pack, packFixedList, packList, packList, poll, processConfigurationPost, processConfigurationPost, setThreadContext, unpack, unpackFixedList, unpackList, viewConfiguration, viewConfiguration
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
check, clearThreadContext, connect, deinstall, disconnect, getConfiguration, install, isConnected, outputConfigurationBody, outputConfigurationHeader, poll, processConfigurationPost, setThreadContext, viewConfiguration
protected static final java.lang.String ACTIVITY_LIMIT
protected static final java.lang.String[] activitiesList
protected static final long inMemoryMaximumFile
public java.lang.String[] getActivitiesList()
getActivitiesList in interface org.apache.manifoldcf.agents.interfaces.ITransformationConnector
getActivitiesList in class org.apache.manifoldcf.agents.transformation.BaseTransformationConnector
public org.apache.manifoldcf.core.interfaces.VersionContext getPipelineDescription(org.apache.manifoldcf.core.interfaces.Specification os)
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException,
org.apache.manifoldcf.agents.interfaces.ServiceInterruption
getPipelineDescription in interface org.apache.manifoldcf.agents.interfaces.IPipelineConnector
getPipelineDescription in class org.apache.manifoldcf.agents.transformation.BaseTransformationConnector
os - is the current output specification for the job that is doing the crawling.
org.apache.manifoldcf.core.interfaces.ManifoldCFException
org.apache.manifoldcf.agents.interfaces.ServiceInterruption
public boolean checkMimeTypeIndexable(org.apache.manifoldcf.core.interfaces.VersionContext outputDescription,
java.lang.String mimeType,
org.apache.manifoldcf.agents.interfaces.IOutputCheckActivity activities)
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException,
org.apache.manifoldcf.agents.interfaces.ServiceInterruption
checkMimeTypeIndexable in interface org.apache.manifoldcf.agents.interfaces.IPipelineConnector
checkMimeTypeIndexable in class org.apache.manifoldcf.agents.transformation.BaseTransformationConnector
outputDescription - is the document's output version.
mimeType - is the mime type of the document.
org.apache.manifoldcf.core.interfaces.ManifoldCFException
org.apache.manifoldcf.agents.interfaces.ServiceInterruption
public boolean checkLengthIndexable(org.apache.manifoldcf.core.interfaces.VersionContext outputDescription,
long length,
org.apache.manifoldcf.agents.interfaces.IOutputCheckActivity activities)
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException,
org.apache.manifoldcf.agents.interfaces.ServiceInterruption
checkLengthIndexable in interface org.apache.manifoldcf.agents.interfaces.IPipelineConnector
checkLengthIndexable in class org.apache.manifoldcf.agents.transformation.BaseTransformationConnector
org.apache.manifoldcf.core.interfaces.ManifoldCFException
org.apache.manifoldcf.agents.interfaces.ServiceInterruption
public int addOrReplaceDocumentWithException(java.lang.String documentURI,
org.apache.manifoldcf.core.interfaces.VersionContext outputDescription,
org.apache.manifoldcf.agents.interfaces.RepositoryDocument document,
java.lang.String authorityNameString,
org.apache.manifoldcf.agents.interfaces.IOutputAddActivity activities)
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException,
org.apache.manifoldcf.agents.interfaces.ServiceInterruption,
java.io.IOException
addOrReplaceDocumentWithException in interface org.apache.manifoldcf.agents.interfaces.IPipelineConnector
addOrReplaceDocumentWithException in class org.apache.manifoldcf.agents.transformation.BaseTransformationConnector
documentURI - is the URI of the document. The URI is presumed to be the unique identifier which the output data store will use to process and serve the document. This URI is constructed by the repository connector which fetches the document, and is thus universal across all output connectors.
outputDescription - is the description string that was constructed for this document by the getOutputDescription() method.
document - is the document data to be processed (handed to the output data store).
authorityNameString - is the name of the authority responsible for authorizing any access tokens passed in with the repository document. May be null.
activities - is the handle to an object that the implementer of an output connector may use to perform operations, such as logging processing activity.
org.apache.manifoldcf.core.interfaces.ManifoldCFException
org.apache.manifoldcf.agents.interfaces.ServiceInterruption
java.io.IOException
protected static void fillInContentSpecificationMap(java.util.Map<java.lang.String,java.lang.Object> paramMap,
org.apache.manifoldcf.core.interfaces.Specification os)
public java.lang.String getFormCheckJavascriptMethodName(int connectionSequenceNumber)
getFormCheckJavascriptMethodName in interface org.apache.manifoldcf.agents.interfaces.IPipelineConnector
getFormCheckJavascriptMethodName in class org.apache.manifoldcf.agents.transformation.BaseTransformationConnector
connectionSequenceNumber - is the unique number of this connection within the job.
public java.lang.String getFormPresaveCheckJavascriptMethodName(int connectionSequenceNumber)
getFormPresaveCheckJavascriptMethodName in interface org.apache.manifoldcf.agents.interfaces.IPipelineConnector
getFormPresaveCheckJavascriptMethodName in class org.apache.manifoldcf.agents.transformation.BaseTransformationConnector
connectionSequenceNumber - is the unique number of this connection within the job.
public void outputSpecificationHeader(org.apache.manifoldcf.core.interfaces.IHTTPOutput out,
java.util.Locale locale,
org.apache.manifoldcf.core.interfaces.Specification os,
int connectionSequenceNumber,
java.util.List<java.lang.String> tabsArray)
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException,
java.io.IOException
outputSpecificationHeader in interface org.apache.manifoldcf.agents.interfaces.IPipelineConnector
outputSpecificationHeader in class org.apache.manifoldcf.agents.transformation.BaseTransformationConnector
out - is the output to which any HTML should be sent.
locale - is the preferred locale of the output.
os - is the current pipeline specification for this connection.
connectionSequenceNumber - is the unique number of this connection within the job.
tabsArray - is an array of tab names. Add to this array any tab names that are specific to the connector.
org.apache.manifoldcf.core.interfaces.ManifoldCFException
java.io.IOException
public void outputSpecificationBody(org.apache.manifoldcf.core.interfaces.IHTTPOutput out,
java.util.Locale locale,
org.apache.manifoldcf.core.interfaces.Specification os,
int connectionSequenceNumber,
int actualSequenceNumber,
java.lang.String tabName)
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException,
java.io.IOException
outputSpecificationBody in interface org.apache.manifoldcf.agents.interfaces.IPipelineConnector
outputSpecificationBody in class org.apache.manifoldcf.agents.transformation.BaseTransformationConnector
out - is the output to which any HTML should be sent.
locale - is the preferred locale of the output.
os - is the current pipeline specification for this job.
connectionSequenceNumber - is the unique number of this connection within the job.
actualSequenceNumber - is the connection within the job that has currently been selected.
tabName - is the current tab name.
org.apache.manifoldcf.core.interfaces.ManifoldCFException
java.io.IOException
public java.lang.String processSpecificationPost(org.apache.manifoldcf.core.interfaces.IPostParameters variableContext,
java.util.Locale locale,
org.apache.manifoldcf.core.interfaces.Specification os,
int connectionSequenceNumber)
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException
processSpecificationPost in interface org.apache.manifoldcf.agents.interfaces.IPipelineConnector
processSpecificationPost in class org.apache.manifoldcf.agents.transformation.BaseTransformationConnector
variableContext - contains the post data, including binary file-upload information.
locale - is the preferred locale of the output.
os - is the current pipeline specification for this job.
connectionSequenceNumber - is the unique number of this connection within the job.
org.apache.manifoldcf.core.interfaces.ManifoldCFException
public void viewSpecification(org.apache.manifoldcf.core.interfaces.IHTTPOutput out,
java.util.Locale locale,
org.apache.manifoldcf.core.interfaces.Specification os,
int connectionSequenceNumber)
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException,
java.io.IOException
viewSpecification in interface org.apache.manifoldcf.agents.interfaces.IPipelineConnector
viewSpecification in class org.apache.manifoldcf.agents.transformation.BaseTransformationConnector
out - is the output to which any HTML should be sent.
locale - is the preferred locale of the output.
connectionSequenceNumber - is the unique number of this connection within the job.
os - is the current pipeline specification for this job.
org.apache.manifoldcf.core.interfaces.ManifoldCFException
java.io.IOException
protected static java.util.Set<java.lang.String> fillSet(java.lang.String input)
protected static int handleIOException(java.io.IOException e)
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException
org.apache.manifoldcf.core.interfaces.ManifoldCFException