public class EsInputFormat<K,V>
extends org.apache.hadoop.mapreduce.InputFormat<K,V>
implements org.apache.hadoop.mapred.InputFormat<K,V>
InputFormat for streaming data (typically based on a query) from Elasticsearch.
Returns the document ID as key and its content as value.
This class implements both the "old" (org.apache.hadoop.mapred) and the "new" (org.apache.hadoop.mapreduce) API.

Modifier and Type | Class and Description |
---|---|
protected static class | EsInputFormat.AbstractWritableEsInputRecordReader<V> |
protected static class | EsInputFormat.EsInputRecordReader<K,V> |
protected static class | EsInputFormat.EsInputSplit |
protected static class | EsInputFormat.JsonWritableEsInputRecordReader |
protected static class | EsInputFormat.WritableEsInputRecordReader |
Constructor and Description |
---|
EsInputFormat() |
Modifier and Type | Method and Description |
---|---|
EsInputFormat.EsInputRecordReader<K,V> | createRecordReader(org.apache.hadoop.mapreduce.InputSplit split, org.apache.hadoop.mapreduce.TaskAttemptContext context) |
EsInputFormat.EsInputRecordReader<K,V> | getRecordReader(org.apache.hadoop.mapred.InputSplit split, org.apache.hadoop.mapred.JobConf job, org.apache.hadoop.mapred.Reporter reporter) |
org.apache.hadoop.mapred.InputSplit[] | getSplits(org.apache.hadoop.mapred.JobConf job, int numSplits) |
java.util.List<org.apache.hadoop.mapreduce.InputSplit> | getSplits(org.apache.hadoop.mapreduce.JobContext context) |
protected boolean | isOutputAsJson(org.apache.hadoop.conf.Configuration cfg) |
public java.util.List<org.apache.hadoop.mapreduce.InputSplit> getSplits(org.apache.hadoop.mapreduce.JobContext context) throws java.io.IOException
public EsInputFormat.EsInputRecordReader<K,V> createRecordReader(org.apache.hadoop.mapreduce.InputSplit split, org.apache.hadoop.mapreduce.TaskAttemptContext context)
public org.apache.hadoop.mapred.InputSplit[] getSplits(org.apache.hadoop.mapred.JobConf job, int numSplits) throws java.io.IOException
public EsInputFormat.EsInputRecordReader<K,V> getRecordReader(org.apache.hadoop.mapred.InputSplit split, org.apache.hadoop.mapred.JobConf job, org.apache.hadoop.mapred.Reporter reporter)
protected boolean isOutputAsJson(org.apache.hadoop.conf.Configuration cfg)