|
||||||||
| PREV CLASS NEXT CLASS | FRAMES NO FRAMES | |||||||
| SUMMARY: NESTED | FIELD | CONSTR | METHOD | DETAIL: FIELD | CONSTR | METHOD | |||||||
java.lang.Object
org.apache.manifoldcf.crawler.connectors.webcrawler.WebcrawlerConnector.ProcessActivityLinkHandler
org.apache.manifoldcf.crawler.connectors.webcrawler.WebcrawlerConnector.ProcessActivityHTMLHandler
protected class WebcrawlerConnector.ProcessActivityHTMLHandler
Class that describes HTML handling
| Field Summary |
|---|
| Fields inherited from class org.apache.manifoldcf.crawler.connectors.webcrawler.WebcrawlerConnector.ProcessActivityLinkHandler |
|---|
activities, contextDescription, documentIdentifier, filter, linkType |
| Constructor Summary | |
|---|---|
WebcrawlerConnector.ProcessActivityHTMLHandler(java.lang.String documentIdentifier,
org.apache.manifoldcf.crawler.interfaces.IProcessActivity activities,
WebcrawlerConnector.DocumentURLFilter filter)
Constructor. |
|
| Method Summary | |
|---|---|
void |
noteAHREF(java.lang.String rawURL)
Note discovered href |
void |
noteFormEnd()
Note the end of a form |
void |
noteFormInput(java.util.Map inputAttributes)
Note an input tag |
void |
noteFormStart(java.util.Map formAttributes)
Note the start of a form |
void |
noteFRAMESRC(java.lang.String rawURL)
Note discovered FRAME SRC |
void |
noteIMGSRC(java.lang.String rawURL)
Note discovered IMG SRC |
void |
noteLINKHREF(java.lang.String rawURL)
Note discovered href |
void |
noteMetaTag(java.util.Map metaAttributes)
Note a meta tag |
boolean |
shouldIndex()
Decide whether we should index. |
| Methods inherited from class org.apache.manifoldcf.crawler.connectors.webcrawler.WebcrawlerConnector.ProcessActivityLinkHandler |
|---|
noteDiscoveredLink |
| Methods inherited from class java.lang.Object |
|---|
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait |
| Methods inherited from interface org.apache.manifoldcf.crawler.connectors.webcrawler.IDiscoveredLinkHandler |
|---|
noteDiscoveredLink |
| Constructor Detail |
|---|
public WebcrawlerConnector.ProcessActivityHTMLHandler(java.lang.String documentIdentifier,
org.apache.manifoldcf.crawler.interfaces.IProcessActivity activities,
WebcrawlerConnector.DocumentURLFilter filter)
| Method Detail |
|---|
public boolean shouldIndex()
public void noteMetaTag(java.util.Map metaAttributes)
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException
Specified by: noteMetaTag in interface IMetaTagHandler
Parameters: metaAttributes - are the attributes that belong to the tag.
Throws: org.apache.manifoldcf.core.interfaces.ManifoldCFException
public void noteFormStart(java.util.Map formAttributes)
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException
Specified by: noteFormStart in interface IHTMLHandler
Throws: org.apache.manifoldcf.core.interfaces.ManifoldCFException
public void noteFormInput(java.util.Map inputAttributes)
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException
Specified by: noteFormInput in interface IHTMLHandler
Throws: org.apache.manifoldcf.core.interfaces.ManifoldCFException
public void noteFormEnd()
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException
Specified by: noteFormEnd in interface IHTMLHandler
Throws: org.apache.manifoldcf.core.interfaces.ManifoldCFException
public void noteAHREF(java.lang.String rawURL)
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException
Specified by: noteAHREF in interface IHTMLHandler
Throws: org.apache.manifoldcf.core.interfaces.ManifoldCFException
public void noteLINKHREF(java.lang.String rawURL)
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException
Specified by: noteLINKHREF in interface IHTMLHandler
Throws: org.apache.manifoldcf.core.interfaces.ManifoldCFException
public void noteIMGSRC(java.lang.String rawURL)
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException
Specified by: noteIMGSRC in interface IHTMLHandler
Throws: org.apache.manifoldcf.core.interfaces.ManifoldCFException
public void noteFRAMESRC(java.lang.String rawURL)
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException
Specified by: noteFRAMESRC in interface IHTMLHandler
Throws: org.apache.manifoldcf.core.interfaces.ManifoldCFException
|
||||||||
| PREV CLASS NEXT CLASS | FRAMES NO FRAMES | |||||||
| SUMMARY: NESTED | FIELD | CONSTR | METHOD | DETAIL: FIELD | CONSTR | METHOD | |||||||