public class CrawlDb
extends org.apache.hadoop.conf.Configured
implements org.apache.hadoop.util.Tool
Modifier and Type | Field and Description |
---|---|
static String | CRAWLDB_ADDITIONS_ALLOWED |
static String | CRAWLDB_PURGE_404 |
static String | CURRENT_NAME |
static String | LOCK_NAME |
static org.slf4j.Logger | LOG |
Constructor and Description |
---|
CrawlDb() |
CrawlDb(org.apache.hadoop.conf.Configuration conf) |
Modifier and Type | Method and Description |
---|---|
static org.apache.hadoop.mapred.JobConf | createJob(org.apache.hadoop.conf.Configuration config, org.apache.hadoop.fs.Path crawlDb) |
static void | install(org.apache.hadoop.mapred.JobConf job, org.apache.hadoop.fs.Path crawlDb) |
static void | main(String[] args) |
int | run(String[] args) |
void | update(org.apache.hadoop.fs.Path crawlDb, org.apache.hadoop.fs.Path[] segments, boolean normalize, boolean filter) |
void | update(org.apache.hadoop.fs.Path crawlDb, org.apache.hadoop.fs.Path[] segments, boolean normalize, boolean filter, boolean additionsAllowed, boolean force) |
public static final org.slf4j.Logger LOG
public static final String CRAWLDB_ADDITIONS_ALLOWED
public static final String CRAWLDB_PURGE_404
public static final String CURRENT_NAME
public static final String LOCK_NAME
public CrawlDb()
public CrawlDb(org.apache.hadoop.conf.Configuration conf)
public void update(org.apache.hadoop.fs.Path crawlDb, org.apache.hadoop.fs.Path[] segments, boolean normalize, boolean filter) throws IOException
Throws: IOException
public void update(org.apache.hadoop.fs.Path crawlDb, org.apache.hadoop.fs.Path[] segments, boolean normalize, boolean filter, boolean additionsAllowed, boolean force) throws IOException
Throws: IOException
public static org.apache.hadoop.mapred.JobConf createJob(org.apache.hadoop.conf.Configuration config, org.apache.hadoop.fs.Path crawlDb) throws IOException
Throws: IOException
public static void install(org.apache.hadoop.mapred.JobConf job, org.apache.hadoop.fs.Path crawlDb) throws IOException
Throws: IOException
Copyright © 2014 The Apache Software Foundation