|
||||||||
| PREV CLASS NEXT CLASS | FRAMES NO FRAMES | |||||||
| SUMMARY: NESTED | FIELD | CONSTR | METHOD | DETAIL: FIELD | CONSTR | METHOD | |||||||
java.lang.Object
  org.apache.manifoldcf.crawler.connectors.webcrawler.BasicParseState
public class BasicParseState
This class represents the basic, outermost parse state.
| Constructor Summary | |
|---|---|
BasicParseState()
|
|
| Method Summary | |
|---|---|
void |
dealWithCharacter(char thisChar)
Deal with a character. |
void |
finishUp()
|
protected static java.lang.String |
htmlAttributeDecode(java.lang.String input)
Decode an HTML attribute. |
protected static boolean |
isHTMLWhitespace(char x)
Is a character HTML whitespace? |
protected static java.lang.String |
mapChunk(java.lang.String input)
Map an entity reference back to a character |
protected void |
noteEndTag(java.lang.String tagName)
|
protected void |
noteTag(java.lang.String tagName,
java.util.Map attributes)
|
| Methods inherited from class java.lang.Object |
|---|
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait |
| Field Detail |
|---|
protected static final int BASICPARSESTATE_NORMAL
protected static final int BASICPARSESTATE_SAWLEFTBRACKET
protected static final int BASICPARSESTATE_SAWEXCLAMATION
protected static final int BASICPARSESTATE_SAWDASH
protected static final int BASICPARSESTATE_IN_COMMENT
protected static final int BASICPARSESTATE_SAWCOMMENTDASH
protected static final int BASICPARSESTATE_SAWSECONDCOMMENTDASH
protected static final int BASICPARSESTATE_IN_TAG_NAME
protected static final int BASICPARSESTATE_IN_ATTR_NAME
protected static final int BASICPARSESTATE_IN_ATTR_VALUE
protected static final int BASICPARSESTATE_IN_TAG_SAW_SLASH
protected static final int BASICPARSESTATE_IN_END_TAG_NAME
protected static final int BASICPARSESTATE_IN_ATTR_LOOKING_FOR_VALUE
protected static final int BASICPARSESTATE_IN_SINGLE_QUOTES_ATTR_VALUE
protected static final int BASICPARSESTATE_IN_DOUBLE_QUOTES_ATTR_VALUE
protected static final int BASICPARSESTATE_IN_UNQUOTED_ATTR_VALUE
protected int currentState
protected java.lang.StringBuffer currentTagNameBuffer
protected java.lang.StringBuffer currentAttrNameBuffer
protected java.lang.StringBuffer currentValueBuffer
protected java.lang.String currentTagName
protected java.lang.String currentAttrName
protected java.util.Map currentAttrMap
protected static final java.util.Map mapLookup
| Constructor Detail |
|---|
public BasicParseState()
| Method Detail |
|---|
public void dealWithCharacter(char thisChar)
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException
Throws: org.apache.manifoldcf.core.interfaces.ManifoldCFException
protected void noteTag(java.lang.String tagName,
java.util.Map attributes)
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException
Throws: org.apache.manifoldcf.core.interfaces.ManifoldCFException
protected void noteEndTag(java.lang.String tagName)
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException
Throws: org.apache.manifoldcf.core.interfaces.ManifoldCFException
public void finishUp()
throws org.apache.manifoldcf.core.interfaces.ManifoldCFException
Throws: org.apache.manifoldcf.core.interfaces.ManifoldCFException
protected static java.lang.String htmlAttributeDecode(java.lang.String input)
protected static java.lang.String mapChunk(java.lang.String input)
protected static boolean isHTMLWhitespace(char x)
|
||||||||
| PREV CLASS NEXT CLASS | FRAMES NO FRAMES | |||||||
| SUMMARY: NESTED | FIELD | CONSTR | METHOD | DETAIL: FIELD | CONSTR | METHOD | |||||||