public class CrawlDbFilter extends Object implements Mapper<Text,CrawlDatum,Text,CrawlDatum>
Modifier and Type | Field and Description |
---|---|
static String | URL_FILTERING |
static String | URL_NORMALIZING |
static String | URL_NORMALIZING_SCOPE |
Constructor and Description |
---|
CrawlDbFilter() |
Modifier and Type | Method and Description |
---|---|
void | close() |
void | configure(JobConf job) |
void | map(Text key, CrawlDatum value, OutputCollector<Text,CrawlDatum> output, Reporter reporter) |
public static final String URL_FILTERING
public static final String URL_NORMALIZING
public static final String URL_NORMALIZING_SCOPE
public void configure(JobConf job)
Specified by: configure in interface JobConfigurable
public void close()
Specified by: close in interface Closeable
Specified by: close in interface AutoCloseable
public void map(Text key, CrawlDatum value, OutputCollector<Text,CrawlDatum> output, Reporter reporter) throws IOException
Specified by: map in interface Mapper<Text,CrawlDatum,Text,CrawlDatum>
Throws: IOException
Copyright © 2017 The Apache Software Foundation