org.apache.mahout.text
Class PrefixAdditionFilter

java.lang.Object
  extended by org.apache.hadoop.conf.Configured
      extended by org.apache.mahout.common.AbstractJob
          extended by org.apache.mahout.text.SequenceFilesFromDirectory
              extended by org.apache.mahout.text.SequenceFilesFromDirectoryFilter
                  extended by org.apache.mahout.text.PrefixAdditionFilter
All Implemented Interfaces:
org.apache.hadoop.conf.Configurable, org.apache.hadoop.fs.PathFilter, org.apache.hadoop.util.Tool

public final class PrefixAdditionFilter
extends SequenceFilesFromDirectoryFilter

Default parser that converts text into sequence files.


Field Summary
 
Fields inherited from class org.apache.mahout.text.SequenceFilesFromDirectoryFilter
charset, conf, fs, options, prefix, writer
 
Fields inherited from class org.apache.mahout.text.SequenceFilesFromDirectory
CHARSET_OPTION, CHUNK_SIZE_OPTION, FILE_FILTER_CLASS_OPTION, KEY_PREFIX_OPTION
 
Constructor Summary
PrefixAdditionFilter(org.apache.hadoop.conf.Configuration conf, String keyPrefix, Map<String,String> options, ChunkedWriter writer)
           
 
Method Summary
protected  void process(org.apache.hadoop.fs.FileStatus fst, org.apache.hadoop.fs.Path current)
           
 
Methods inherited from class org.apache.mahout.text.SequenceFilesFromDirectoryFilter
accept, getOptions
 
Methods inherited from class org.apache.mahout.text.SequenceFilesFromDirectory
addOptions, main, parseOptions, run, run
 
Methods inherited from class org.apache.mahout.common.AbstractJob
addFlag, addInputOption, addOption, addOption, addOption, addOption, addOutputOption, buildOption, getInputPath, getOption, getOutputPath, hasOption, keyFor, maybePut, parseArguments, parseDirectories, prepareJob, shouldRunNextPhase
 
Methods inherited from class org.apache.hadoop.conf.Configured
getConf, setConf
 
Methods inherited from class java.lang.Object
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
 
Methods inherited from interface org.apache.hadoop.conf.Configurable
getConf, setConf
 

Constructor Detail

PrefixAdditionFilter

public PrefixAdditionFilter(org.apache.hadoop.conf.Configuration conf,
                            String keyPrefix,
                            Map<String,String> options,
                            ChunkedWriter writer)
                     throws IOException
Throws:
IOException
Method Detail

process

protected void process(org.apache.hadoop.fs.FileStatus fst,
                       org.apache.hadoop.fs.Path current)
                throws IOException
Specified by:
process in class SequenceFilesFromDirectoryFilter
Throws:
IOException


Copyright © 2008-2011 The Apache Software Foundation. All Rights Reserved.