public class FindHTMLHrefHandler extends FindHandler implements IHTMLHandler
| Modifier and Type | Field and Description |
|---|---|
| protected java.util.regex.Pattern | preferredLinkPattern |

Inherited fields: parentURI, targetURI

| Constructor and Description |
|---|
| FindHTMLHrefHandler(java.lang.String parentURI, java.util.regex.Pattern preferredLinkPattern) |
| Modifier and Type | Method and Description |
|---|---|
| void | applyOverrides(LoginParameters lp) — Apply overrides |
| void | finishUp() — Done with the document. |
| void | noteAHREF(java.lang.String rawURL) — Note discovered href |
| void | noteBASEHREF(java.lang.String rawURL) — Note discovered base |
| void | noteDiscoveredBase(java.lang.String rawURL) — Inform the world of a new base HREF. |
| void | noteDiscoveredLink(java.lang.String rawURL) — Override noteDiscoveredLink |
| void | noteFormEnd() — Note the end of a form |
| void | noteFormInput(java.util.Map inputAttributes) — Note an input tag |
| void | noteFormStart(java.util.Map formAttributes) — Note the start of a form |
| void | noteFRAMESRC(java.lang.String rawURL) — Note discovered FRAME SRC |
| void | noteIMGSRC(java.lang.String rawURL) — Note discovered IMG SRC |
| void | noteLINKHREF(java.lang.String rawURL) — Note discovered href |
| void | noteMetaTag(java.util.Map metaAttributes) — Note a meta tag |
| void | noteTextCharacter(char textCharacter) — Note a character of text. |
Inherited methods: getTargetURI

public FindHTMLHrefHandler(java.lang.String parentURI,
java.util.regex.Pattern preferredLinkPattern)
public void applyOverrides(LoginParameters lp) throws org.apache.manifoldcf.core.interfaces.ManifoldCFException
Throws: org.apache.manifoldcf.core.interfaces.ManifoldCFException

public void noteTextCharacter(char textCharacter)
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException
Specified by: noteTextCharacter in interface IHTMLHandler
Throws: org.apache.manifoldcf.core.interfaces.ManifoldCFException

public void noteMetaTag(java.util.Map metaAttributes)
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException
Specified by: noteMetaTag in interface IMetaTagHandler
Parameters: metaAttributes - are the attributes that belong to the tag.
Throws: org.apache.manifoldcf.core.interfaces.ManifoldCFException

public void noteFormStart(java.util.Map formAttributes)
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException
Specified by: noteFormStart in interface IHTMLHandler
Throws: org.apache.manifoldcf.core.interfaces.ManifoldCFException

public void noteFormInput(java.util.Map inputAttributes)
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException
Specified by: noteFormInput in interface IHTMLHandler
Throws: org.apache.manifoldcf.core.interfaces.ManifoldCFException

public void noteFormEnd()
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException
Specified by: noteFormEnd in interface IHTMLHandler
Throws: org.apache.manifoldcf.core.interfaces.ManifoldCFException

public void noteDiscoveredBase(java.lang.String rawURL)
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException
Description copied from interface IDiscoveredLinkHandler: Inform the world of a new base HREF.
Specified by: noteDiscoveredBase in interface IDiscoveredLinkHandler
Overrides: noteDiscoveredBase in class FindHandler
Parameters: rawURL - is the new base HREF, in raw form. This may be relative, malformed, etc.
Throws: org.apache.manifoldcf.core.interfaces.ManifoldCFException

public void noteDiscoveredLink(java.lang.String rawURL)
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException
Specified by: noteDiscoveredLink in interface IDiscoveredLinkHandler
Overrides: noteDiscoveredLink in class FindHandler
Parameters: rawURL - is the raw discovered url. This may be relative, malformed, or otherwise unsuitable for use until final form is achieved.
Throws: org.apache.manifoldcf.core.interfaces.ManifoldCFException

public void noteBASEHREF(java.lang.String rawURL)
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException
Specified by: noteBASEHREF in interface IHTMLHandler
Throws: org.apache.manifoldcf.core.interfaces.ManifoldCFException

public void noteAHREF(java.lang.String rawURL)
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException
Specified by: noteAHREF in interface IHTMLHandler
Throws: org.apache.manifoldcf.core.interfaces.ManifoldCFException

public void noteLINKHREF(java.lang.String rawURL)
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException
Specified by: noteLINKHREF in interface IHTMLHandler
Throws: org.apache.manifoldcf.core.interfaces.ManifoldCFException

public void noteIMGSRC(java.lang.String rawURL)
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException
Specified by: noteIMGSRC in interface IHTMLHandler
Throws: org.apache.manifoldcf.core.interfaces.ManifoldCFException

public void noteFRAMESRC(java.lang.String rawURL)
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException
Specified by: noteFRAMESRC in interface IHTMLHandler
Throws: org.apache.manifoldcf.core.interfaces.ManifoldCFException

public void finishUp()
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException
Description copied from interface IHTMLHandler: Done with the document.
Specified by: finishUp in interface IHTMLHandler
Throws: org.apache.manifoldcf.core.interfaces.ManifoldCFException