|
|||||||||
| PREV CLASS NEXT CLASS | FRAMES NO FRAMES | ||||||||
| SUMMARY: NESTED | FIELD | CONSTR | METHOD | DETAIL: FIELD | CONSTR | METHOD | ||||||||
java.lang.Object
javax.swing.text.html.HTMLEditorKit.ParserCallback
net.firstpartners.rp.back.extractor.util.Spider.SpiderParserCallback
public class Spider.SpiderParserCallback
Inner class
| Field Summary | |
|---|---|
private boolean |
foundSummary
flag to mark that the summary was found |
private boolean |
isInBody
flag to mark that the body tag is currently being processed |
private boolean |
isInScript
flag to mark that a script tag is currently being processed |
private boolean |
isInTitle
flag to mark that the title tag is currently being processed |
private java.lang.String |
lastText
contents of last text element |
static java.lang.String |
METADATA_AUTHOR
Author meta data |
static java.lang.String |
METADATA_DESCRIPTION
Description meta data |
static java.lang.String |
METADATA_SUMMARY
Summary meta data |
static java.lang.String |
METADATA_WEBMASTER
Webmaster meta data |
private java.lang.StringBuffer |
summaryText
summary text |
| Fields inherited from class javax.swing.text.html.HTMLEditorKit.ParserCallback |
|---|
IMPLIED |
| Constructor Summary | |
|---|---|
Spider.SpiderParserCallback()
Creates a new instance of SpiderParserCallback |
|
| Method Summary | |
|---|---|
void |
handleEndTag(javax.swing.text.html.HTML.Tag t,
int pos)
take care of end tags |
void |
handleSimpleTag(javax.swing.text.html.HTML.Tag t,
javax.swing.text.MutableAttributeSet a,
int pos)
handle HTML tags that don't have a start and end tag |
void |
handleStartTag(javax.swing.text.html.HTML.Tag t,
javax.swing.text.MutableAttributeSet a,
int pos)
take care of start tags |
void |
handleText(char[] data,
int pos)
take care of text between tags: check it against the keyword list for matches and, if a match is found, set the node match status to true |
| Methods inherited from class javax.swing.text.html.HTMLEditorKit.ParserCallback |
|---|
flush, handleComment, handleEndOfLineString, handleError |
| Methods inherited from class java.lang.Object |
|---|
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait |
| Field Detail |
|---|
public static final java.lang.String METADATA_DESCRIPTION
public static final java.lang.String METADATA_SUMMARY
public static final java.lang.String METADATA_AUTHOR
public static final java.lang.String METADATA_WEBMASTER
private java.lang.String lastText
private java.lang.StringBuffer summaryText
private boolean isInTitle
private boolean isInBody
private boolean isInScript
private boolean foundSummary
| Constructor Detail |
|---|
public Spider.SpiderParserCallback()
| Method Detail |
|---|
public void handleSimpleTag(javax.swing.text.html.HTML.Tag t,
javax.swing.text.MutableAttributeSet a,
int pos)
Overrides: handleSimpleTag in class javax.swing.text.html.HTMLEditorKit.ParserCallback. Parameters: t - HTML tag; a - HTML attributes; pos - Position within file
public void handleStartTag(javax.swing.text.html.HTML.Tag t,
javax.swing.text.MutableAttributeSet a,
int pos)
Overrides: handleStartTag in class javax.swing.text.html.HTMLEditorKit.ParserCallback. Parameters: t - HTML tag; a - HTML attributes; pos - Position within file
public void handleEndTag(javax.swing.text.html.HTML.Tag t,
int pos)
Overrides: handleEndTag in class javax.swing.text.html.HTMLEditorKit.ParserCallback. Parameters: t - HTML tag; pos - Position within file
public void handleText(char[] data,
int pos)
Overrides: handleText in class javax.swing.text.html.HTMLEditorKit.ParserCallback. Parameters: data - Text between tags; pos - position of text within web page
|
|||||||||
| PREV CLASS NEXT CLASS | FRAMES NO FRAMES | ||||||||
| SUMMARY: NESTED | FIELD | CONSTR | METHOD | DETAIL: FIELD | CONSTR | METHOD | ||||||||