|
||||||||
| PREV CLASS NEXT CLASS | FRAMES NO FRAMES | |||||||
| SUMMARY: NESTED | FIELD | CONSTR | METHOD | DETAIL: FIELD | CONSTR | METHOD | |||||||
java.lang.Object
  org.apache.manifoldcf.crawler.connectors.webcrawler.WebcrawlerConnector.FindHandler
    org.apache.manifoldcf.crawler.connectors.webcrawler.WebcrawlerConnector.FindHTMLFormHandler
protected class WebcrawlerConnector.FindHTMLFormHandler
This class is the handler for HTML form parsing during state transitions
| Field Summary | |
|---|---|
protected FormDataAccumulator |
currentFormData
|
protected FormDataAccumulator |
discoveredFormData
|
protected java.util.regex.Pattern |
formNamePattern
|
| Fields inherited from class org.apache.manifoldcf.crawler.connectors.webcrawler.WebcrawlerConnector.FindHandler |
|---|
parentURI, targetURI |
| Constructor Summary | |
|---|---|
WebcrawlerConnector.FindHTMLFormHandler(java.lang.String parentURI,
java.util.regex.Pattern formNamePattern)
|
|
| Method Summary | |
|---|---|
void |
applyFormOverrides(LoginParameters lp)
|
FormData |
getFormData()
|
void |
noteAHREF(java.lang.String rawURL)
Note discovered href |
void |
noteFormEnd()
Note the end of a form |
void |
noteFormInput(java.util.Map inputAttributes)
Note an input tag |
void |
noteFormStart(java.util.Map formAttributes)
Note the start of a form |
void |
noteFRAMESRC(java.lang.String rawURL)
Note discovered FRAME SRC |
void |
noteIMGSRC(java.lang.String rawURL)
Note discovered IMG SRC |
void |
noteLINKHREF(java.lang.String rawURL)
Note discovered href |
void |
noteMetaTag(java.util.Map metaAttributes)
Note a meta tag |
| Methods inherited from class org.apache.manifoldcf.crawler.connectors.webcrawler.WebcrawlerConnector.FindHandler |
|---|
getTargetURI, noteDiscoveredLink |
| Methods inherited from class java.lang.Object |
|---|
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait |
| Methods inherited from interface org.apache.manifoldcf.crawler.connectors.webcrawler.IDiscoveredLinkHandler |
|---|
noteDiscoveredLink |
| Field Detail |
|---|
protected java.util.regex.Pattern formNamePattern
protected FormDataAccumulator discoveredFormData
protected FormDataAccumulator currentFormData
| Constructor Detail |
|---|
public WebcrawlerConnector.FindHTMLFormHandler(java.lang.String parentURI,
java.util.regex.Pattern formNamePattern)
| Method Detail |
|---|
public void applyFormOverrides(LoginParameters lp)
public FormData getFormData()
public void noteMetaTag(java.util.Map metaAttributes)
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException
Specified by: noteMetaTag in interface IMetaTagHandler
Parameters: metaAttributes - the attributes that belong to the tag.
Throws: org.apache.manifoldcf.core.interfaces.ManifoldCFException
public void noteFormStart(java.util.Map formAttributes)
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException
Specified by: noteFormStart in interface IHTMLHandler
Throws: org.apache.manifoldcf.core.interfaces.ManifoldCFException
public void noteFormInput(java.util.Map inputAttributes)
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException
Specified by: noteFormInput in interface IHTMLHandler
Throws: org.apache.manifoldcf.core.interfaces.ManifoldCFException
public void noteFormEnd()
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException
Specified by: noteFormEnd in interface IHTMLHandler
Throws: org.apache.manifoldcf.core.interfaces.ManifoldCFException
public void noteAHREF(java.lang.String rawURL)
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException
Specified by: noteAHREF in interface IHTMLHandler
Throws: org.apache.manifoldcf.core.interfaces.ManifoldCFException
public void noteLINKHREF(java.lang.String rawURL)
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException
Specified by: noteLINKHREF in interface IHTMLHandler
Throws: org.apache.manifoldcf.core.interfaces.ManifoldCFException
public void noteIMGSRC(java.lang.String rawURL)
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException
Specified by: noteIMGSRC in interface IHTMLHandler
Throws: org.apache.manifoldcf.core.interfaces.ManifoldCFException
public void noteFRAMESRC(java.lang.String rawURL)
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException
Specified by: noteFRAMESRC in interface IHTMLHandler
Throws: org.apache.manifoldcf.core.interfaces.ManifoldCFException
|
||||||||
| PREV CLASS NEXT CLASS | FRAMES NO FRAMES | |||||||
| SUMMARY: NESTED | FIELD | CONSTR | METHOD | DETAIL: FIELD | CONSTR | METHOD | |||||||