Class FileInputFormatCsv
java.lang.Object
org.apache.hadoop.mapreduce.InputFormat<K,V>
org.apache.hadoop.mapreduce.lib.input.FileInputFormat<org.apache.hadoop.io.LongWritable,List>
net.sansa_stack.hadoop.format.commons_csv.csv.FileInputFormatCsv
public class FileInputFormatCsv
extends org.apache.hadoop.mapreduce.lib.input.FileInputFormat<org.apache.hadoop.io.LongWritable,List>
-
Nested Class Summary
Nested classes/interfaces inherited from class org.apache.hadoop.mapreduce.lib.input.FileInputFormat
org.apache.hadoop.mapreduce.lib.input.FileInputFormat.Counter -
Field Summary
Fields inherited from class org.apache.hadoop.mapreduce.lib.input.FileInputFormat
DEFAULT_LIST_STATUS_NUM_THREADS, INPUT_DIR, INPUT_DIR_NONRECURSIVE_IGNORE_SUBDIRS, INPUT_DIR_RECURSIVE, LIST_STATUS_NUM_THREADS, NUM_INPUT_FILES, PATHFILTER_CLASS, SPLIT_MAXSIZE, SPLIT_MINSIZE -
Constructor Summary
Constructors -
Method Summary
Modifier and Type | Method | Description
org.apache.hadoop.mapreduce.RecordReader<org.apache.hadoop.io.LongWritable,List> | createRecordReader(org.apache.hadoop.mapreduce.InputSplit inputSplit, org.apache.hadoop.mapreduce.TaskAttemptContext context) |
static org.apache.commons.csv.CSVFormat | getCsvFormat(org.apache.hadoop.conf.Configuration conf, org.apache.commons.csv.CSVFormat defaultValue) |
boolean | isSplitable(org.apache.hadoop.mapreduce.JobContext context, org.apache.hadoop.fs.Path file) |
static void | setCsvFormat(org.apache.hadoop.conf.Configuration conf, org.apache.commons.csv.CSVFormat csvFormat) |
Methods inherited from class org.apache.hadoop.mapreduce.lib.input.FileInputFormat
addInputPath, addInputPathRecursively, addInputPaths, computeSplitSize, getBlockIndex, getFormatMinSplitSize, getInputDirRecursive, getInputPathFilter, getInputPaths, getMaxSplitSize, getMinSplitSize, getSplits, listStatus, makeSplit, makeSplit, setInputDirRecursive, setInputPathFilter, setInputPaths, setInputPaths, setMaxInputSplitSize, setMinInputSplitSize, shrinkStatus
-
Constructor Details
-
FileInputFormatCsv
public FileInputFormatCsv()
-
-
Method Details
-
isSplitable
public boolean isSplitable(org.apache.hadoop.mapreduce.JobContext context, org.apache.hadoop.fs.Path file) - Overrides:
isSplitable in class org.apache.hadoop.mapreduce.lib.input.FileInputFormat<org.apache.hadoop.io.LongWritable,List>
-
createRecordReader
public org.apache.hadoop.mapreduce.RecordReader<org.apache.hadoop.io.LongWritable,List> createRecordReader(org.apache.hadoop.mapreduce.InputSplit inputSplit, org.apache.hadoop.mapreduce.TaskAttemptContext context) - Specified by:
createRecordReader in class org.apache.hadoop.mapreduce.InputFormat<org.apache.hadoop.io.LongWritable,List>
-
setCsvFormat
public static void setCsvFormat(org.apache.hadoop.conf.Configuration conf, org.apache.commons.csv.CSVFormat csvFormat) -
getCsvFormat
public static org.apache.commons.csv.CSVFormat getCsvFormat(org.apache.hadoop.conf.Configuration conf, org.apache.commons.csv.CSVFormat defaultValue)
-