|
|||||||||
PREV CLASS NEXT CLASS | FRAMES NO FRAMES | ||||||||
SUMMARY: NESTED | FIELD | CONSTR | METHOD | DETAIL: FIELD | CONSTR | METHOD |
java.lang.Object javax.swing.text.html.HTMLEditorKit.ParserCallback net.firstpartners.rp.back.extractor.util.Spider.SpiderParserCallback
public class Spider.SpiderParserCallback
Inner class
Field Summary | |
---|---|
private boolean |
foundSummary
flag to mark that the summary was found |
private boolean |
isInBody
flag to mark that a body tag is currently being processed |
private boolean |
isInScript
flag to mark that a script tag is currently being processed |
private boolean |
isInTitle
flag to mark that a title tag is currently being processed |
private java.lang.String |
lastText
contents of last text element |
static java.lang.String |
METADATA_AUTHOR
Author meta data |
static java.lang.String |
METADATA_DESCRIPTION
Description meta data |
static java.lang.String |
METADATA_SUMMARY
Summary meta data |
static java.lang.String |
METADATA_WEBMASTER
Webmaster meta data |
private java.lang.StringBuffer |
summaryText
summary text |
Fields inherited from class javax.swing.text.html.HTMLEditorKit.ParserCallback |
---|
IMPLIED |
Constructor Summary | |
---|---|
Spider.SpiderParserCallback()
Creates a new instance of SpiderParserCallback |
Method Summary | |
---|---|
void |
handleEndTag(javax.swing.text.html.HTML.Tag t,
int pos)
take care of end tags |
void |
handleSimpleTag(javax.swing.text.html.HTML.Tag t,
javax.swing.text.MutableAttributeSet a,
int pos)
handle HTML tags that don't have a start and end tag |
void |
handleStartTag(javax.swing.text.html.HTML.Tag t,
javax.swing.text.MutableAttributeSet a,
int pos)
take care of start tags |
void |
handleText(char[] data,
int pos)
take care of text between tags, check against keyword list for matches, if match found, set the node match status to true |
Methods inherited from class javax.swing.text.html.HTMLEditorKit.ParserCallback |
---|
flush, handleComment, handleEndOfLineString, handleError |
Methods inherited from class java.lang.Object |
---|
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait |
Field Detail |
---|
public static final java.lang.String METADATA_DESCRIPTION
public static final java.lang.String METADATA_SUMMARY
public static final java.lang.String METADATA_AUTHOR
public static final java.lang.String METADATA_WEBMASTER
private java.lang.String lastText
private java.lang.StringBuffer summaryText
private boolean isInTitle
private boolean isInBody
private boolean isInScript
private boolean foundSummary
Constructor Detail |
---|
public Spider.SpiderParserCallback()
Method Detail |
---|
public void handleSimpleTag(javax.swing.text.html.HTML.Tag t, javax.swing.text.MutableAttributeSet a, int pos)
handleSimpleTag
in class javax.swing.text.html.HTMLEditorKit.ParserCallback
t
- HTML tag
a
- HTML attributes
pos
- Position within file
public void handleStartTag(javax.swing.text.html.HTML.Tag t, javax.swing.text.MutableAttributeSet a, int pos)
handleStartTag
in class javax.swing.text.html.HTMLEditorKit.ParserCallback
t
- HTML tag
a
- HTML attributes
pos
- Position within file
public void handleEndTag(javax.swing.text.html.HTML.Tag t, int pos)
handleEndTag
in class javax.swing.text.html.HTMLEditorKit.ParserCallback
t
- HTML tag
pos
- Position within file
public void handleText(char[] data, int pos)
handleText
in class javax.swing.text.html.HTMLEditorKit.ParserCallback
data
- Text between tags
pos
- position of text within web page
|
|||||||||
PREV CLASS NEXT CLASS | FRAMES NO FRAMES | ||||||||
SUMMARY: NESTED | FIELD | CONSTR | METHOD | DETAIL: FIELD | CONSTR | METHOD |