public class Subcollection extends Configured implements URLFilter
Modifier and Type | Field and Description |
---|---|
static java.lang.String |
TAG_BLACKLIST |
static java.lang.String |
TAG_COLLECTION |
static java.lang.String |
TAG_COLLECTIONS |
static java.lang.String |
TAG_ID |
static java.lang.String |
TAG_NAME |
static java.lang.String |
TAG_WHITELIST |
X_POINT_ID
Constructor and Description |
---|
Subcollection(Configuration conf) |
Subcollection(java.lang.String id,
java.lang.String name,
Configuration conf)
public Constructor
|
Modifier and Type | Method and Description |
---|---|
java.lang.String |
filter(java.lang.String urlString)
Simple "indexOf" filter for matching patterns.
|
java.lang.String |
getBlackListString()
Returns blacklist String
|
java.lang.String |
getId() |
java.lang.String |
getName() |
java.util.ArrayList<java.lang.String> |
getWhiteList()
Returns whitelist
|
java.lang.String |
getWhiteListString()
Returns whitelist String
|
void |
initialize(org.w3c.dom.Element collection)
Initialize Subcollection from dom element
|
protected void |
parseList(java.util.ArrayList<java.lang.String> list,
java.lang.String text)
Create a list of patterns from a chunk of text; patterns are separated by
newlines
|
void |
setBlackList(java.lang.String list)
Set contents of blacklist from String
|
void |
setWhiteList(java.util.ArrayList<java.lang.String> whiteList) |
void |
setWhiteList(java.lang.String list)
Set contents of whitelist from String
|
getConf, setConf
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
getConf, setConf
public static final java.lang.String TAG_COLLECTIONS
public static final java.lang.String TAG_COLLECTION
public static final java.lang.String TAG_WHITELIST
public static final java.lang.String TAG_BLACKLIST
public static final java.lang.String TAG_NAME
public static final java.lang.String TAG_ID
public Subcollection(java.lang.String id, java.lang.String name, Configuration conf)
id
- id of SubCollection
name
- name of SubCollection
public Subcollection(Configuration conf)
public java.lang.String getName()
public java.lang.String getId()
public java.util.ArrayList<java.lang.String> getWhiteList()
public java.lang.String getWhiteListString()
public java.lang.String getBlackListString()
public void setWhiteList(java.util.ArrayList<java.lang.String> whiteList)
whiteList
- The whiteList to set.
public java.lang.String filter(java.lang.String urlString)
Rules for evaluation are as follows: 1. if a pattern in the blacklist matches, the url is rejected; 2. if a pattern in the whitelist matches, the url is allowed; 3. otherwise the url is rejected.
filter
in interface URLFilter
URLFilter.filter(java.lang.String)
public void initialize(org.w3c.dom.Element collection)
collection
-
protected void parseList(java.util.ArrayList<java.lang.String> list, java.lang.String text)
list
-
text
-
public void setBlackList(java.lang.String list)
list
- the blacklist contents
public void setWhiteList(java.lang.String list)
list
- the whitelist contents
Copyright © 2019 The Apache Software Foundation