public class LinkDb extends NutchTool implements Tool
Modifier and Type | Class and Description |
---|---|
static class | LinkDb.LinkDbMapper |
Modifier and Type | Field and Description |
---|---|
static String | CURRENT_NAME |
static String | IGNORE_EXTERNAL_LINKS |
static String | IGNORE_INTERNAL_LINKS |
static String | LOCK_NAME |
Fields inherited from class NutchTool: currentJob, currentJobNum, numJobs, results, status
Constructor and Description |
---|
LinkDb() |
LinkDb(Configuration conf) |
Modifier and Type | Method and Description |
---|---|
static void | install(Job job, Path linkDb) |
void | invert(Path linkDb, Path[] segments, boolean normalize, boolean filter, boolean force) |
void | invert(Path linkDb, Path segmentsDir, boolean normalize, boolean filter, boolean force) |
static void | main(String[] args) |
Map<String,Object> | run(Map<String,Object> args, String crawlId): Runs the tool, using a map of arguments. |
int | run(String[] args) |
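Methods inherited from class NutchTool: getProgress, getStatus, killJob, stopJob
Methods inherited from class org.apache.hadoop.conf.Configured: getConf, setConf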
Methods inherited from class java.lang.Object: clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
Methods inherited from interface org.apache.hadoop.conf.Configurable: getConf, setConf
public static final String IGNORE_INTERNAL_LINKS
public static final String IGNORE_EXTERNAL_LINKS
public static final String CURRENT_NAME
public static final String LOCK_NAME
public LinkDb()
public LinkDb(Configuration conf)
public void invert(Path linkDb, Path segmentsDir, boolean normalize, boolean filter, boolean force) throws IOException, InterruptedException, ClassNotFoundException
public void invert(Path linkDb, Path[] segments, boolean normalize, boolean filter, boolean force) throws IOException, InterruptedException, ClassNotFoundException
public static void install(Job job, Path linkDb) throws IOException
Throws: IOException
Copyright © 2021 The Apache Software Foundation