public final class InputSplitUtils extends Object
| Modifier and Type | Method and Description |
|---|---|
static String |
expandInputFolder(org.apache.hadoop.conf.Configuration conf)
Expand an input folder into the files it contains, so that all files in that folder are supported as input.
|
static int |
getBlockIndex(org.apache.hadoop.fs.BlockLocation[] blkLocations,
long offset) |
static List<List<org.apache.hadoop.mapreduce.InputSplit>> |
getCombineGuaguaSplits(List<org.apache.hadoop.mapreduce.InputSplit> oneInputSplits,
long maxCombinedSplitSize) |
static List<org.apache.hadoop.mapreduce.InputSplit> |
getFileSplits(org.apache.hadoop.conf.Configuration conf,
long splitSize)
Generate the list of files and make them into FileSplits.
|
static List<org.apache.hadoop.mapreduce.InputSplit> |
getFinalCombineGuaguaSplits(List<org.apache.hadoop.mapreduce.InputSplit> newSplits,
long combineSize)
Copied from the Pig implementation; the logic of this code still needs to be checked.
|
static List<org.apache.hadoop.mapreduce.InputSplit> |
getGuaguaSplits(org.apache.hadoop.conf.Configuration conf,
long splitSize)
Generate the list of files and make them into FileSplits.
|
static org.apache.hadoop.fs.FileStatus[] |
listStatus(org.apache.hadoop.conf.Configuration conf)
List all the input files.
|
public static List<org.apache.hadoop.mapreduce.InputSplit> getFinalCombineGuaguaSplits(List<org.apache.hadoop.mapreduce.InputSplit> newSplits, long combineSize) throws IOException
Throws: IOException
public static org.apache.hadoop.fs.FileStatus[] listStatus(org.apache.hadoop.conf.Configuration conf)
throws IOException
Throws: IOException
public static String expandInputFolder(org.apache.hadoop.conf.Configuration conf) throws IOException
Throws: IOException
public static List<org.apache.hadoop.mapreduce.InputSplit> getFileSplits(org.apache.hadoop.conf.Configuration conf, long splitSize) throws IOException
Throws: IOException
public static List<org.apache.hadoop.mapreduce.InputSplit> getGuaguaSplits(org.apache.hadoop.conf.Configuration conf, long splitSize) throws IOException
Throws: IOException
public static int getBlockIndex(org.apache.hadoop.fs.BlockLocation[] blkLocations,
long offset)
public static List<List<org.apache.hadoop.mapreduce.InputSplit>> getCombineGuaguaSplits(List<org.apache.hadoop.mapreduce.InputSplit> oneInputSplits, long maxCombinedSplitSize) throws IOException, InterruptedException
Throws: IOException, InterruptedException
Copyright © 2015. All Rights Reserved.