public class WebTableReader extends NutchTool implements Tool
Modifier and Type | Class and Description |
---|---|
static class | WebTableReader.WebTableRegexMapper — Filters the entries from the table based on a regex. |
static class | WebTableReader.WebTableStatCombiner |
static class | WebTableReader.WebTableStatMapper |
static class | WebTableReader.WebTableStatReducer |
Fields inherited from class NutchTool: currentJob, currentJobNum, numJobs, results, status
Constructor and Description |
---|
WebTableReader() |
Modifier and Type | Method and Description |
---|---|
static void | main(java.lang.String[] args) |
void | processDumpJob(java.lang.String output, Configuration config, java.lang.String regex, boolean content, boolean headers, boolean links, boolean text) |
void | processStatJob(boolean sort) |
java.util.Map<java.lang.String,java.lang.Object> | run(java.util.Map<java.lang.String,java.lang.Object> args) — Runs the tool, using a map of arguments. |
int | run(java.lang.String[] args) |
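Methods inherited from class NutchTool: getProgress, getStatus, killJob, stopJob
Methods inherited from class Configured: getConf, setConf
Methods inherited from class java.lang.Object: clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
Methods inherited from interface Configurable: getConf, setConf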
public void processStatJob(boolean sort) throws java.lang.Exception
Throws: java.lang.Exception
public void processDumpJob(java.lang.String output, Configuration config, java.lang.String regex, boolean content, boolean headers, boolean links, boolean text) throws java.io.IOException, java.lang.ClassNotFoundException, java.lang.InterruptedException
Throws: java.io.IOException, java.lang.ClassNotFoundException, java.lang.InterruptedException
public static void main(java.lang.String[] args) throws java.lang.Exception
Throws: java.lang.Exception
public int run(java.lang.String[] args) throws java.lang.Exception
public java.util.Map<java.lang.String,java.lang.Object> run(java.util.Map<java.lang.String,java.lang.Object> args) throws java.lang.Exception
NutchTool
Copyright © 2019 The Apache Software Foundation