@Internal public abstract class CsvInputFormat<OUT> extends GenericCsvInputFormat<OUT>
FileInputFormat.FileBaseStatistics, FileInputFormat.InputSplitOpenThread
Modifier and Type | Field and Description |
---|---|
static String | DEFAULT_FIELD_DELIMITER |
static String | DEFAULT_LINE_DELIMITER |
protected Object[] | parsedValues |
commentCount, commentPrefix, fieldIncluded, invalidLineCount, lineDelimiterIsLinebreak
RECORD_DELIMITER
currentSplit, ENUMERATE_NESTED_FILES_FLAG, enumerateNestedFiles, filePath, INFLATER_INPUT_STREAM_FACTORIES, minSplitSize, numSplits, openTimeout, READ_WHOLE_SPLIT_FLAG, splitLength, splitStart, stream, unsplittable
Modifier | Constructor and Description |
---|---|
protected | CsvInputFormat(Path filePath) |
Modifier and Type | Method and Description |
---|---|
protected static boolean[] | createDefaultMask(int size) |
protected abstract OUT | fillRecord(OUT reuse, Object[] parsedValues) |
Class<?>[] | getFieldTypes() |
OUT | nextRecord(OUT record) |
void | open(FileInputSplit split) |
OUT | readRecord(OUT reuse, byte[] bytes, int offset, int numBytes) |
protected static boolean[] | toBooleanMask(int[] sourceFieldIndices) |
String | toString() |
checkAndCoSort, checkForMonotonousOrder, close, enableQuotedStringParsing, getCommentPrefix, getFieldDelimiter, getFieldParsers, getGenericFieldTypes, getNumberOfFieldsTotal, getNumberOfNonNullFields, isLenient, isSkippingFirstLineAsHeader, parseRecord, setCommentPrefix, setCommentPrefix, setCommentPrefix, setCommentPrefix, setCommentPrefix, setFieldDelimiter, setFieldDelimiter, setFieldDelimiter, setFieldsGeneric, setFieldsGeneric, setFieldTypesGeneric, setLenient, setSkipFirstLineAsHeader, skipFields
configure, getBufferSize, getDelimiter, getLineLengthLimit, getNumLineSamples, getStatistics, loadGlobalConfigParams, reachedEnd, readLine, setBufferSize, setDelimiter, setDelimiter, setDelimiter, setLineLengthLimit, setNumLineSamples
acceptFile, createInputSplits, decorateInputStream, extractFileExtension, getFilePath, getFileStats, getInflaterInputStreamFactory, getInputSplitAssigner, getMinSplitSize, getNumSplits, getOpenTimeout, getSplitLength, getSplitStart, registerInflaterInputStreamFactory, setFilePath, setFilePath, setMinSplitSize, setNumSplits, setOpenTimeout, testForUnsplittable
getRuntimeContext, setRuntimeContext
public static final String DEFAULT_LINE_DELIMITER
public static final String DEFAULT_FIELD_DELIMITER
protected transient Object[] parsedValues
protected CsvInputFormat(Path filePath)
public void open(FileInputSplit split) throws IOException
open in interface InputFormat<OUT,FileInputSplit>
open in class GenericCsvInputFormat<OUT>
Throws: IOException
public OUT nextRecord(OUT record) throws IOException
nextRecord in interface InputFormat<OUT,FileInputSplit>
nextRecord in class DelimitedInputFormat<OUT>
Throws: IOException
public OUT readRecord(OUT reuse, byte[] bytes, int offset, int numBytes) throws IOException
readRecord in class DelimitedInputFormat<OUT>
Throws: IOException
public Class<?>[] getFieldTypes()
protected static boolean[] createDefaultMask(int size)
protected static boolean[] toBooleanMask(int[] sourceFieldIndices)
public String toString()
toString in class FileInputFormat<OUT>
Copyright © 2014–2016 The Apache Software Foundation. All rights reserved.