public class CsvInputFormat<OUT> extends GenericCsvInputFormat<OUT>
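Nested classes/interfaces inherited from class DelimitedInputFormat: DelimitedInputFormat.AbstractConfigBuilder<T>, DelimitedInputFormat.ConfigBuilder
Nested classes/interfaces inherited from class FileInputFormat: FileInputFormat.FileBaseStatistics, FileInputFormat.InputSplitOpenThread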
Modifier and Type | Field and Description |
---|---|
static String | DEFAULT_FIELD_DELIMITER |
static String | DEFAULT_LINE_DELIMITER |
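Fields inherited from class GenericCsvInputFormat: commentCount, commentPrefix, fieldIncluded, invalidLineCount, lineDelimiterIsLinebreak
Fields inherited from class DelimitedInputFormat: RECORD_DELIMITER
Fields inherited from class FileInputFormat: DEFLATE_SUFFIX, enumerateNestedFiles, filePath, minSplitSize, numSplits, openTimeout, READ_WHOLE_SPLIT_FLAG, splitLength, splitStart, stream, unsplittable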
Constructor and Description |
---|
CsvInputFormat(Path filePath, String lineDelimiter, String fieldDelimiter, TypeInformation<OUT> typeInformation) |
CsvInputFormat(Path filePath, TypeInformation<OUT> typeInformation) |
Modifier and Type | Method and Description |
---|---|
Class<?>[] | getFieldTypes() |
OUT | nextRecord(OUT record) |
void | open(FileInputSplit split) |
OUT | readRecord(OUT reuse, byte[] bytes, int offset, int numBytes) |
void | setFields(boolean[] sourceFieldMask, Class<?>[] fieldTypes) |
void | setFields(int[] sourceFieldIndices, Class<?>[] fieldTypes) |
void | setFieldTypes(Class<?>... fieldTypes) |
void | setOrderOfPOJOFields(String[] fieldsOrder) |
String | toString() |
Methods inherited from class GenericCsvInputFormat: checkAndCoSort, checkForMonotonousOrder, close, enableQuotedStringParsing, getCommentPrefix, getFieldDelimiter, getFieldParsers, getGenericFieldTypes, getNumberOfFieldsTotal, getNumberOfNonNullFields, isLenient, isSkippingFirstLineAsHeader, parseRecord, setCommentPrefix, setCommentPrefix, setCommentPrefix, setCommentPrefix, setCommentPrefix, setFieldDelimiter, setFieldDelimiter, setFieldDelimiter, setFieldsGeneric, setFieldsGeneric, setFieldTypesGeneric, setLenient, setSkipFirstLineAsHeader, skipFields
Methods inherited from class DelimitedInputFormat: configure, configureDelimitedFormat, getBufferSize, getDelimiter, getLineLengthLimit, getNumLineSamples, getStatistics, loadGloablConfigParams, reachedEnd, readLine, setBufferSize, setDelimiter, setDelimiter, setDelimiter, setLineLengthLimit, setNumLineSamples
Methods inherited from class FileInputFormat: acceptFile, configureFileFormat, createInputSplits, getFilePath, getFileStats, getInputSplitAssigner, getMinSplitSize, getNumSplits, getOpenTimeout, getSplitLength, getSplitStart, setFilePath, setFilePath, setMinSplitSize, setNumSplits, setOpenTimeout, testForUnsplittable
public static final String DEFAULT_LINE_DELIMITER
public static final String DEFAULT_FIELD_DELIMITER
public CsvInputFormat(Path filePath, TypeInformation<OUT> typeInformation)
public CsvInputFormat(Path filePath, String lineDelimiter, String fieldDelimiter, TypeInformation<OUT> typeInformation)
public void setOrderOfPOJOFields(String[] fieldsOrder)
public void setFieldTypes(Class<?>... fieldTypes)
public void setFields(int[] sourceFieldIndices, Class<?>[] fieldTypes)
public void setFields(boolean[] sourceFieldMask, Class<?>[] fieldTypes)
public Class<?>[] getFieldTypes()
public void open(FileInputSplit split) throws IOException
Specified by: open in interface InputFormat<OUT,FileInputSplit>
Overrides: open in class GenericCsvInputFormat<OUT>
Throws: IOException
public OUT nextRecord(OUT record) throws IOException
Specified by: nextRecord in interface InputFormat<OUT,FileInputSplit>
Overrides: nextRecord in class DelimitedInputFormat<OUT>
Throws: IOException
public OUT readRecord(OUT reuse, byte[] bytes, int offset, int numBytes) throws IOException
Specified by: readRecord in class DelimitedInputFormat<OUT>
Throws: IOException
public String toString()
Overrides: toString in class FileInputFormat<OUT>
Copyright © 2014–2015 The Apache Software Foundation. All rights reserved.