org.apache.accumulo.examples.wikisearch.ingest
Class WikipediaIngester

java.lang.Object
  extended by org.apache.hadoop.conf.Configured
      extended by org.apache.accumulo.examples.wikisearch.ingest.WikipediaIngester
All Implemented Interfaces:
org.apache.hadoop.conf.Configurable, org.apache.hadoop.util.Tool

public class WikipediaIngester
extends org.apache.hadoop.conf.Configured
implements org.apache.hadoop.util.Tool


Field Summary
protected static Pattern filePattern
           
static String INGEST_LANGUAGE
           
static org.apache.hadoop.fs.PathFilter partFilter
           
static String SPLIT_FILE
           
static String TABLE_NAME
           
 
Constructor Summary
WikipediaIngester()
           
 
Method Summary
protected  void configureJob(org.apache.hadoop.mapreduce.Job job)
           
protected  void listFiles(org.apache.hadoop.fs.Path path, org.apache.hadoop.fs.FileSystem fs, List<org.apache.hadoop.fs.Path> files, Set<String> languages)
           
static void main(String[] args)
           
 int run(String[] args)
           
 
Methods inherited from class org.apache.hadoop.conf.Configured
getConf, setConf
 
Methods inherited from class java.lang.Object
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
 
Methods inherited from interface org.apache.hadoop.conf.Configurable
getConf, setConf
 

Field Detail

INGEST_LANGUAGE

public static final String INGEST_LANGUAGE
See Also:
Constant Field Values

SPLIT_FILE

public static final String SPLIT_FILE
See Also:
Constant Field Values

TABLE_NAME

public static final String TABLE_NAME
See Also:
Constant Field Values

partFilter

public static final org.apache.hadoop.fs.PathFilter partFilter

filePattern

protected static final Pattern filePattern

Constructor Detail

WikipediaIngester

public WikipediaIngester()

Method Detail

main

public static void main(String[] args)
                 throws Exception
Throws:
Exception

run

public int run(String[] args)
        throws Exception
Specified by:
run in interface org.apache.hadoop.util.Tool
Throws:
Exception

configureJob

protected void configureJob(org.apache.hadoop.mapreduce.Job job)

listFiles

protected void listFiles(org.apache.hadoop.fs.Path path,
                         org.apache.hadoop.fs.FileSystem fs,
                         List<org.apache.hadoop.fs.Path> files,
                         Set<String> languages)
                  throws IOException
Throws:
IOException


Copyright © 2012 The Apache Software Foundation. All Rights Reserved.