org.apache.accumulo.examples.wikisearch.ingest
Class WikipediaPartitionedIngester
java.lang.Object
org.apache.hadoop.conf.Configured
org.apache.accumulo.examples.wikisearch.ingest.WikipediaPartitionedIngester
- All Implemented Interfaces:
- org.apache.hadoop.conf.Configurable, org.apache.hadoop.util.Tool
public class WikipediaPartitionedIngester
- extends org.apache.hadoop.conf.Configured
- implements org.apache.hadoop.util.Tool
Methods inherited from class org.apache.hadoop.conf.Configured:
getConf, setConf
Methods inherited from class java.lang.Object:
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
Methods inherited from interface org.apache.hadoop.conf.Configurable:
getConf, setConf
INGEST_LANGUAGE
public static final String INGEST_LANGUAGE
- See Also:
- Constant Field Values
SPLIT_FILE
public static final String SPLIT_FILE
- See Also:
- Constant Field Values
TABLE_NAME
public static final String TABLE_NAME
- See Also:
- Constant Field Values
partFilter
public static final org.apache.hadoop.fs.PathFilter partFilter
filePattern
protected static final Pattern filePattern
WikipediaPartitionedIngester
public WikipediaPartitionedIngester()
main
public static void main(String[] args)
throws Exception
- Throws:
Exception
run
public int run(String[] args)
throws Exception
- Specified by:
run
in interface org.apache.hadoop.util.Tool
- Throws:
Exception
configurePartitionerJob
protected void configurePartitionerJob(org.apache.hadoop.mapreduce.Job job)
configureIngestJob
protected void configureIngestJob(org.apache.hadoop.mapreduce.Job job)
listFiles
protected void listFiles(org.apache.hadoop.fs.Path path,
org.apache.hadoop.fs.FileSystem fs,
List<org.apache.hadoop.fs.Path> files,
Set<String> languages)
throws IOException
- Throws:
IOException
Copyright © 2012 The Apache Software Foundation. All Rights Reserved.