|
||||||||
| PREV CLASS NEXT CLASS | FRAMES NO FRAMES | |||||||
| SUMMARY: NESTED | FIELD | CONSTR | METHOD | DETAIL: FIELD | CONSTR | METHOD | |||||||
java.lang.Object
javax.swing.text.html.HTMLEditorKit.ParserCallback
org.apache.lenya.search.crawler.HTMLHandler
public final class HTMLHandler
DOCUMENT ME!
| Field Summary |
|---|
| Fields inherited from class javax.swing.text.html.HTMLEditorKit.ParserCallback |
|---|
IMPLIED |
| Constructor Summary | |
|---|---|
HTMLHandler()
Constructor - initializes variables |
|
| Method Summary | |
|---|---|
java.lang.String |
getAuthor()
Return author |
java.lang.String |
getCategories()
Return categories (from META tags) |
java.lang.String |
getContents()
Return contents |
java.lang.String |
getDescription()
Return description (from META tags) |
java.lang.String |
getHREF()
Return META HREF |
java.lang.String |
getKeywords()
Return keywords (from META tags) |
java.util.List |
getLinks()
Return links |
long |
getPublished()
Return published date (from META tag) |
boolean |
getRobotFollow()
Return boolean true if links are to be followed |
boolean |
getRobotIndex()
Return boolean true if this is to be indexed |
java.lang.String |
getTitle()
Return page title |
void |
handleAnchor(javax.swing.text.MutableAttributeSet attribs)
Handle Anchor tags |
void |
handleEndTag(javax.swing.text.html.HTML.Tag tag,
int pos)
Closing tag |
void |
handleMeta(javax.swing.text.MutableAttributeSet attribs)
Handle META tags |
void |
handleSimpleTag(javax.swing.text.html.HTML.Tag tag,
javax.swing.text.MutableAttributeSet attribs,
int pos)
Handle standalone tags |
void |
handleStartTag(javax.swing.text.html.HTML.Tag tag,
javax.swing.text.MutableAttributeSet attribs,
int pos)
Opening tag |
void |
handleText(char[] text,
int pos)
Handle page text |
void |
parse(java.io.InputStream in)
Parse Content. |
| Methods inherited from class javax.swing.text.html.HTMLEditorKit.ParserCallback |
|---|
flush, handleComment, handleEndOfLineString, handleError |
| Methods inherited from class java.lang.Object |
|---|
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait |
| Constructor Detail |
|---|
public HTMLHandler()
| Method Detail |
|---|
public java.lang.String getAuthor()
getAuthor in interface ContentHandler
public java.lang.String getCategories()
getCategories in interface ContentHandler
public java.lang.String getContents()
getContents in interface ContentHandler
public java.lang.String getDescription()
getDescription in interface ContentHandler
public java.lang.String getHREF()
getHREF in interface ContentHandler
public java.lang.String getKeywords()
getKeywords in interface ContentHandler
public java.util.List getLinks()
getLinks in interface ContentHandler
public long getPublished()
getPublished in interface ContentHandler
public boolean getRobotFollow()
getRobotFollow in interface ContentHandler
public boolean getRobotIndex()
getRobotIndex in interface ContentHandler
public java.lang.String getTitle()
getTitle in interface ContentHandler
public void handleAnchor(javax.swing.text.MutableAttributeSet attribs)
attribs - DOCUMENT ME!
public void handleEndTag(javax.swing.text.html.HTML.Tag tag,
int pos)
handleEndTag in class javax.swing.text.html.HTMLEditorKit.ParserCallback
tag - DOCUMENT ME!
pos - DOCUMENT ME!
public void handleMeta(javax.swing.text.MutableAttributeSet attribs)
attribs - DOCUMENT ME!
public void handleSimpleTag(javax.swing.text.html.HTML.Tag tag,
javax.swing.text.MutableAttributeSet attribs,
int pos)
handleSimpleTag in class javax.swing.text.html.HTMLEditorKit.ParserCallback
tag - DOCUMENT ME!
attribs - DOCUMENT ME!
pos - DOCUMENT ME!
public void handleStartTag(javax.swing.text.html.HTML.Tag tag,
javax.swing.text.MutableAttributeSet attribs,
int pos)
handleStartTag in class javax.swing.text.html.HTMLEditorKit.ParserCallback
tag - DOCUMENT ME!
attribs - DOCUMENT ME!
pos - DOCUMENT ME!
public void handleText(char[] text,
int pos)
handleText in class javax.swing.text.html.HTMLEditorKit.ParserCallback
text - DOCUMENT ME!
pos - DOCUMENT ME!
public void parse(java.io.InputStream in)
parse in interface ContentHandler
in - DOCUMENT ME!
|
||||||||
| PREV CLASS NEXT CLASS | FRAMES NO FRAMES | |||||||
| SUMMARY: NESTED | FIELD | CONSTR | METHOD | DETAIL: FIELD | CONSTR | METHOD | |||||||