public abstract class BaseLinkExtractor
extends org.xml.sax.helpers.DefaultHandler
implements java.io.Serializable
Modifier and Type | Field and Description |
---|---|
protected java.lang.StringBuilder | _curAnchor |
protected java.lang.String | _curRelAttributes |
protected java.lang.String | _curUrl |
protected java.lang.String | _inAnchorTag |
protected java.util.Set<java.lang.String> | _linkAttributeTypes |
protected java.util.Set<java.lang.String> | _linkTags |
static java.util.Set<java.lang.String> | ALL_LINK_ATTRIBUTE_TYPES |
static java.util.Set<java.lang.String> | ALL_LINK_TAGS |
static java.util.Set<java.lang.String> | DEFAULT_LINK_ATTRIBUTE_TYPES |
static java.util.Set<java.lang.String> | DEFAULT_LINK_TAGS |
Constructor and Description |
---|
BaseLinkExtractor() |
Modifier and Type | Method and Description |
---|---|
void | addLink(Outlink link) |
void | characters(char[] ch, int start, int length) |
void | endElement(java.lang.String uri, java.lang.String localName, java.lang.String name) |
java.util.Set<java.lang.String> | getLinkAttributeTypes() |
abstract Outlink[] | getLinks() |
java.util.Set<java.lang.String> | getLinkTags() |
void | reset() |
void | setLinkAttributeTypes(java.util.Set<java.lang.String> linkAttributeTypes) |
void | setLinkTags(java.util.Set<java.lang.String> linkTags) |
void | startElement(java.lang.String uri, java.lang.String localName, java.lang.String qName, org.xml.sax.Attributes attributes) |
public static final java.util.Set<java.lang.String> DEFAULT_LINK_TAGS
public static final java.util.Set<java.lang.String> ALL_LINK_TAGS
public static final java.util.Set<java.lang.String> DEFAULT_LINK_ATTRIBUTE_TYPES
public static final java.util.Set<java.lang.String> ALL_LINK_ATTRIBUTE_TYPES
protected java.lang.String _inAnchorTag
protected java.lang.String _curUrl
protected java.lang.String _curRelAttributes
protected java.lang.StringBuilder _curAnchor
protected java.util.Set<java.lang.String> _linkTags
protected java.util.Set<java.lang.String> _linkAttributeTypes
public void setLinkTags(java.util.Set<java.lang.String> linkTags)
Parameters:
linkTags - to collect Outlinks from (defaults to DEFAULT_LINK_TAGS).
Note: There is no need to construct your own SimpleLinkExtractor simply to control the set of link tags it processes. Instead, provide this set of link tags to ParserPolicy.
public java.util.Set<java.lang.String> getLinkTags()
public void setLinkAttributeTypes(java.util.Set<java.lang.String> linkAttributeTypes)
Parameters:
linkAttributeTypes - to collect Outlinks from (defaults to DEFAULT_LINK_ATTRIBUTE_TYPES).
Note: There is no need to construct your own SimpleLinkExtractor simply to control the set of link attributes it processes. Instead, provide this set of attributes to ParserPolicy.
public java.util.Set<java.lang.String> getLinkAttributeTypes()
public void reset()
public void addLink(Outlink link)
public abstract Outlink[] getLinks()
public void startElement(java.lang.String uri, java.lang.String localName, java.lang.String qName, org.xml.sax.Attributes attributes) throws org.xml.sax.SAXException
Specified by: startElement in interface org.xml.sax.ContentHandler
Overrides: startElement in class org.xml.sax.helpers.DefaultHandler
Throws: org.xml.sax.SAXException
public void characters(char[] ch, int start, int length) throws org.xml.sax.SAXException
Specified by: characters in interface org.xml.sax.ContentHandler
Overrides: characters in class org.xml.sax.helpers.DefaultHandler
Throws: org.xml.sax.SAXException
public void endElement(java.lang.String uri, java.lang.String localName, java.lang.String name) throws org.xml.sax.SAXException
Specified by: endElement in interface org.xml.sax.ContentHandler
Overrides: endElement in class org.xml.sax.helpers.DefaultHandler
Throws: org.xml.sax.SAXException
Copyright © 2012 Bixo Labs