org.apache.hadoop.mapreduce.lib.input.NLineInputFormat.getSplitsForFile Java code examples

/**
 * Builds the input splits for the job so that each split covers N lines
 * of an input file.
 *
 * <p>Every file returned by {@code listStatus(job)} is handed to
 * {@code org.apache.hadoop.mapreduce.lib.input.NLineInputFormat.getSplitsForFile}
 * together with {@code N}; each split it yields is wrapped with
 * {@code new FileSplit(...)} and collected.
 *
 * @param job the job configuration used to list and split the input files
 * @param numSplits not read by this method
 * @return an array holding one {@code FileSplit} per split produced
 * @throws IOException if one of the calls made here raises it
 * @see org.apache.hadoop.mapred.FileInputFormat#getSplits(JobConf, int)
 */
public InputSplit[] getSplits(JobConf job, int numSplits)
throws IOException {
 ArrayList<FileSplit> wrapped = new ArrayList<FileSplit>();
 for (FileStatus inputFile : listStatus(job)) {
  for (org.apache.hadoop.mapreduce.lib.input.FileSplit lineSplit :
    org.apache.hadoop.mapreduce.lib.input.NLineInputFormat
      .getSplitsForFile(inputFile, job, N)) {
   wrapped.add(new FileSplit(lineSplit));
  }
 }
 // Exactly-sized target array, so toArray fills and returns it.
 FileSplit[] result = new FileSplit[wrapped.size()];
 return wrapped.toArray(result);
}

/**
 * Computes the input splits for the job, with each split covering N lines
 * of an input file.
 *
 * <p>The lines-per-split value is read once via
 * {@code getNumLinesPerSplit(job)}; every file returned by
 * {@code listStatus(job)} is then split by {@code getSplitsForFile} and
 * the results are appended in listing order.
 *
 * @param job the job context supplying the configuration and input files
 * @return a newly created list with the splits of every listed input file
 * @throws IOException if one of the calls made here raises it
 * @see FileInputFormat#getSplits(JobContext)
 */
public List<InputSplit> getSplits(JobContext job)
throws IOException {
 final int linesPerSplit = getNumLinesPerSplit(job);
 final List<InputSplit> allSplits = new ArrayList<InputSplit>();
 for (final FileStatus inputFile : listStatus(job)) {
  allSplits.addAll(
    getSplitsForFile(inputFile, job.getConfiguration(), linesPerSplit));
 }
 return allSplits;
}

/**
 * Builds the input splits for the job so that each split covers N lines
 * of an input file.
 *
 * <p>Every file returned by {@code listStatus(job)} is handed to
 * {@code org.apache.hadoop.mapreduce.lib.input.NLineInputFormat.getSplitsForFile}
 * together with {@code N}; each split it yields is wrapped with
 * {@code new FileSplit(...)} and collected.
 *
 * @param job the job configuration used to list and split the input files
 * @param numSplits not read by this method
 * @return an array holding one {@code FileSplit} per split produced
 * @throws IOException if one of the calls made here raises it
 * @see org.apache.hadoop.mapred.FileInputFormat#getSplits(JobConf, int)
 */
public InputSplit[] getSplits(JobConf job, int numSplits)
throws IOException {
 ArrayList<FileSplit> wrapped = new ArrayList<FileSplit>();
 for (FileStatus inputFile : listStatus(job)) {
  for (org.apache.hadoop.mapreduce.lib.input.FileSplit lineSplit :
    org.apache.hadoop.mapreduce.lib.input.NLineInputFormat
      .getSplitsForFile(inputFile, job, N)) {
   wrapped.add(new FileSplit(lineSplit));
  }
 }
 // Exactly-sized target array, so toArray fills and returns it.
 FileSplit[] result = new FileSplit[wrapped.size()];
 return wrapped.toArray(result);
}

/**
 * Computes the input splits for the job, with each split covering N lines
 * of an input file.
 *
 * <p>The lines-per-split value is read once via
 * {@code getNumLinesPerSplit(job)}; every file returned by
 * {@code listStatus(job)} is then split by {@code getSplitsForFile} and
 * the results are appended in listing order.
 *
 * @param job the job context supplying the configuration and input files
 * @return a newly created list with the splits of every listed input file
 * @throws IOException if one of the calls made here raises it
 * @see FileInputFormat#getSplits(JobContext)
 */
public List<InputSplit> getSplits(JobContext job)
throws IOException {
 final int linesPerSplit = getNumLinesPerSplit(job);
 final List<InputSplit> allSplits = new ArrayList<InputSplit>();
 for (final FileStatus inputFile : listStatus(job)) {
  allSplits.addAll(
    getSplitsForFile(inputFile, job.getConfiguration(), linesPerSplit));
 }
 return allSplits;
}

/**
 * Computes the input splits for the job, with each split covering N lines
 * of an input file.
 *
 * <p>The lines-per-split value is read once via
 * {@code getNumLinesPerSplit(job)}; every file returned by
 * {@code listStatus(job)} is then split by {@code getSplitsForFile} and
 * the results are appended in listing order.
 *
 * @param job the job context supplying the configuration and input files
 * @return a newly created list with the splits of every listed input file
 * @throws IOException if one of the calls made here raises it
 * @see FileInputFormat#getSplits(JobContext)
 */
public List<InputSplit> getSplits(JobContext job)
throws IOException {
 final int linesPerSplit = getNumLinesPerSplit(job);
 final List<InputSplit> allSplits = new ArrayList<InputSplit>();
 for (final FileStatus inputFile : listStatus(job)) {
  allSplits.addAll(
    getSplitsForFile(inputFile, job.getConfiguration(), linesPerSplit));
 }
 return allSplits;
}

/**
 * Builds the input splits for the job so that each split covers N lines
 * of an input file.
 *
 * <p>Every file returned by {@code listStatus(job)} is handed to
 * {@code org.apache.hadoop.mapreduce.lib.input.NLineInputFormat.getSplitsForFile}
 * together with {@code N}; each split it yields is wrapped with
 * {@code new FileSplit(...)} and collected.
 *
 * @param job the job configuration used to list and split the input files
 * @param numSplits not read by this method
 * @return an array holding one {@code FileSplit} per split produced
 * @throws IOException if one of the calls made here raises it
 * @see org.apache.hadoop.mapred.FileInputFormat#getSplits(JobConf, int)
 */
public InputSplit[] getSplits(JobConf job, int numSplits)
throws IOException {
 ArrayList<FileSplit> wrapped = new ArrayList<FileSplit>();
 for (FileStatus inputFile : listStatus(job)) {
  for (org.apache.hadoop.mapreduce.lib.input.FileSplit lineSplit :
    org.apache.hadoop.mapreduce.lib.input.NLineInputFormat
      .getSplitsForFile(inputFile, job, N)) {
   wrapped.add(new FileSplit(lineSplit));
  }
 }
 // Exactly-sized target array, so toArray fills and returns it.
 FileSplit[] result = new FileSplit[wrapped.size()];
 return wrapped.toArray(result);
}

/**
 * Computes the input splits for the job, with each split covering N lines
 * of an input file.
 *
 * <p>The lines-per-split value is read once via
 * {@code getNumLinesPerSplit(job)}; every file returned by
 * {@code listStatus(job)} is then split by {@code getSplitsForFile} and
 * the results are appended in listing order.
 *
 * @param job the job context supplying the configuration and input files
 * @return a newly created list with the splits of every listed input file
 * @throws IOException if one of the calls made here raises it
 * @see FileInputFormat#getSplits(JobContext)
 */
public List<InputSplit> getSplits(JobContext job)
throws IOException {
 final int linesPerSplit = getNumLinesPerSplit(job);
 final List<InputSplit> allSplits = new ArrayList<InputSplit>();
 for (final FileStatus inputFile : listStatus(job)) {
  allSplits.addAll(
    getSplitsForFile(inputFile, job.getConfiguration(), linesPerSplit));
 }
 return allSplits;
}

/**
 * Computes the input splits for the job, with each split covering N lines
 * of an input file.
 *
 * <p>The lines-per-split value is read once via
 * {@code getNumLinesPerSplit(job)}; every file returned by
 * {@code listStatus(job)} is then split by {@code getSplitsForFile} and
 * the results are appended in listing order.
 *
 * @param job the job context supplying the configuration and input files
 * @return a newly created list with the splits of every listed input file
 * @throws IOException if one of the calls made here raises it
 * @see FileInputFormat#getSplits(JobContext)
 */
public List<InputSplit> getSplits(JobContext job)
throws IOException {
 final int linesPerSplit = getNumLinesPerSplit(job);
 final List<InputSplit> allSplits = new ArrayList<InputSplit>();
 for (final FileStatus inputFile : listStatus(job)) {
  allSplits.addAll(
    getSplitsForFile(inputFile, job.getConfiguration(), linesPerSplit));
 }
 return allSplits;
}

/**
 * Builds the input splits for the job so that each split covers N lines
 * of an input file.
 *
 * <p>Every file returned by {@code listStatus(job)} is handed to
 * {@code org.apache.hadoop.mapreduce.lib.input.NLineInputFormat.getSplitsForFile}
 * together with {@code N}; each split it yields is wrapped with
 * {@code new FileSplit(...)} and collected.
 *
 * @param job the job configuration used to list and split the input files
 * @param numSplits not read by this method
 * @return an array holding one {@code FileSplit} per split produced
 * @throws IOException if one of the calls made here raises it
 * @see org.apache.hadoop.mapred.FileInputFormat#getSplits(JobConf, int)
 */
public InputSplit[] getSplits(JobConf job, int numSplits)
throws IOException {
 ArrayList<FileSplit> wrapped = new ArrayList<FileSplit>();
 for (FileStatus inputFile : listStatus(job)) {
  for (org.apache.hadoop.mapreduce.lib.input.FileSplit lineSplit :
    org.apache.hadoop.mapreduce.lib.input.NLineInputFormat
      .getSplitsForFile(inputFile, job, N)) {
   wrapped.add(new FileSplit(lineSplit));
  }
 }
 // Exactly-sized target array, so toArray fills and returns it.
 FileSplit[] result = new FileSplit[wrapped.size()];
 return wrapped.toArray(result);
}

/**
 * Builds the input splits for the job so that each split covers N lines
 * of an input file.
 *
 * <p>Every file returned by {@code listStatus(job)} is handed to
 * {@code org.apache.hadoop.mapreduce.lib.input.NLineInputFormat.getSplitsForFile}
 * together with {@code N}; each split it yields is wrapped with
 * {@code new FileSplit(...)} and collected.
 *
 * @param job the job configuration used to list and split the input files
 * @param numSplits not read by this method
 * @return an array holding one {@code FileSplit} per split produced
 * @throws IOException if one of the calls made here raises it
 * @see org.apache.hadoop.mapred.FileInputFormat#getSplits(JobConf, int)
 */
public InputSplit[] getSplits(JobConf job, int numSplits)
throws IOException {
 ArrayList<FileSplit> wrapped = new ArrayList<FileSplit>();
 for (FileStatus inputFile : listStatus(job)) {
  for (org.apache.hadoop.mapreduce.lib.input.FileSplit lineSplit :
    org.apache.hadoop.mapreduce.lib.input.NLineInputFormat
      .getSplitsForFile(inputFile, job, N)) {
   wrapped.add(new FileSplit(lineSplit));
  }
 }
 // Exactly-sized target array, so toArray fills and returns it.
 FileSplit[] result = new FileSplit[wrapped.size()];
 return wrapped.toArray(result);
}

  /**
   * Computes the input splits for the job, with each split covering N lines
   * of an input file.
   *
   * <p>The lines-per-split value comes from
   * {@code NLineInputFormat.getNumLinesPerSplit(job)}; every entry returned by
   * {@code listStatus(job)} is split by
   * {@code NLineInputFormat.getSplitsForFile} and the results are appended in
   * listing order. When debug logging is enabled, a message is logged if
   * recursive input directory search is on, and one message is logged per
   * listed entry.
   *
   * @param job the job context supplying the configuration and input files
   * @return a newly created list with the splits of every listed entry
   * @throws IOException if one of the calls made here raises it
   * @see FileInputFormat#getSplits(JobContext)
   */
  @Override
  public final List<InputSplit> getSplits(JobContext job) throws IOException {
    // Sampled once so the recursive-search check and per-file logging agree.
    final boolean debugEnabled = LOGGER.isDebugEnabled();
    if (debugEnabled) {
      if (FileInputFormat.getInputDirRecursive(job)) {
        LOGGER.debug("Recursive searching for input data is enabled");
      }
    }

    final int linesPerSplit = NLineInputFormat.getNumLinesPerSplit(job);
    final List<InputSplit> allSplits = new ArrayList<InputSplit>();
    for (final FileStatus inputFile : listStatus(job)) {
      if (debugEnabled) {
        LOGGER.debug("Determining how to split input file/directory {}", inputFile.getPath());
      }
      allSplits.addAll(
          NLineInputFormat.getSplitsForFile(inputFile, job.getConfiguration(), linesPerSplit));
    }
    return allSplits;
  }
}

  /**
   * Computes the input splits for the job, with each split covering N lines
   * of an input file.
   *
   * <p>The lines-per-split value comes from
   * {@code NLineInputFormat.getNumLinesPerSplit(job)}; every entry returned by
   * {@code listStatus(job)} is split by
   * {@code NLineInputFormat.getSplitsForFile} and the results are appended in
   * listing order. When debug logging is enabled, a message is logged if
   * recursive input directory search is on, and one message is logged per
   * listed entry.
   *
   * @param job the job context supplying the configuration and input files
   * @return a newly created list with the splits of every listed entry
   * @throws IOException if one of the calls made here raises it
   * @see FileInputFormat#getSplits(JobContext)
   */
  @Override
  public final List<InputSplit> getSplits(JobContext job) throws IOException {
    // Sampled once so the recursive-search check and per-file logging agree.
    final boolean debugEnabled = LOGGER.isDebugEnabled();
    if (debugEnabled) {
      if (FileInputFormat.getInputDirRecursive(job)) {
        LOGGER.debug("Recursive searching for input data is enabled");
      }
    }

    final int linesPerSplit = NLineInputFormat.getNumLinesPerSplit(job);
    final List<InputSplit> allSplits = new ArrayList<InputSplit>();
    for (final FileStatus inputFile : listStatus(job)) {
      if (debugEnabled) {
        LOGGER.debug("Determining how to split input file/directory {}", inputFile.getPath());
      }
      allSplits.addAll(
          NLineInputFormat.getSplitsForFile(inputFile, job.getConfiguration(), linesPerSplit));
    }
    return allSplits;
  }
}

Popular methods of NLineInputFormat

setNumLinesPerSplit
Set the number of lines per split
getNumLinesPerSplit
Get the number of lines per split
listStatus
addInputPath
createFileSplit
NLineInputFormat uses LineRecordReader, which always reads (and consumes) at least one character out of its upper split boundary.
<init>
createRecordReader
getSplits
Logically splits the set of input files for the job, splits N lines of the input as one split.
setInputPaths

Popular in Java

Reactive rest calls using spring rest template
onRequestPermissionsResult (Fragment)
addToBackStack (FragmentTransaction)
getSharedPreferences (Context)
Proxy (java.net)
This class represents proxy server settings. A created instance of Proxy stores a type and an address…
Manifest (java.util.jar)
The Manifest class is used to obtain attribute information for a JarFile and its entries.
GridLayout (java.awt)
The GridLayout class is a layout manager that lays out a container's components in a rectangular grid.
BufferedImage (java.awt.image)
The BufferedImage subclass describes a java.awt.Image with an accessible buffer of image data. All…
JPanel (javax.swing)
Option (scala)
From CI to AI: The AI layer in your organization

How to use the getSplitsForFile method in org.apache.hadoop.mapreduce.lib.input.NLineInputFormat

Best Java code snippets using org.apache.hadoop.mapreduce.lib.input.NLineInputFormat.getSplitsForFile (Showing top 12 results out of 315)

How to use the getSplitsForFile method in org.apache.hadoop.mapreduce.lib.input.NLineInputFormat