@Override
public JobContext createJobContext(Configuration conf, JobID jobId) {
    // Preserve the more specific JobConf type by copying it; otherwise pass the Configuration through.
    return new JobContextImpl(conf instanceof JobConf ? new JobConf(conf) : conf, jobId);
}
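For orientation, a hypothetical caller of the factory method above; the `factory` variable and the job ID value are illustrative assumptions, not from the source:

// Hypothetical usage sketch: `factory` is an instance of the class declaring createJobContext.
JobConf jobConf = new JobConf();
JobContext ctx = factory.createJobContext(jobConf, JobID.forName("job_1400000000000_0001"));
// Because createJobContext copies a JobConf into a fresh instance, later mutations
// of jobConf do not leak into the returned context.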
/**
 * Get the timestamps of the archives. Used by internal
 * DistributedCache and MapReduce code.
 * @return a string array of timestamps
 */
public String[] getArchiveTimestamps() {
    return toTimestampStrs(DistributedCache.getArchiveTimestamps(conf));
}
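The toTimestampStrs helper is not shown in this excerpt; a minimal sketch of its assumed behavior, converting the long[] timestamps reported by DistributedCache into the string array this API returns:

// Assumed shape of the toTimestampStrs helper referenced above (not shown in the source):
private static String[] toTimestampStrs(long[] timestamps) {
    if (timestamps == null) {
        return null;
    }
    String[] result = new String[timestamps.length];
    for (int i = 0; i < timestamps.length; i++) {
        result[i] = Long.toString(timestamps[i]);
    }
    return result;
}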
/**
 * The user-specified job name.
 */
public String getJobName() {
    if (state == JobState.DEFINE) {
        return super.getJobName();
    }
    ensureState(JobState.RUNNING);
    return status.getJobName();
}
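getJobName relies on an ensureState guard that is not part of this excerpt; a minimal sketch of its assumed contract, failing fast when the job has not reached the expected lifecycle state:

// Assumed behavior of the ensureState guard used above: throw if the job
// is not in the expected state (e.g., RUNNING after submission).
private void ensureState(JobState state) throws IllegalStateException {
    if (state != this.state) {
        throw new IllegalStateException(
            "Job in state " + this.state + " instead of " + state);
    }
}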
@Override
public org.apache.hadoop.mapreduce.JobContext newJobContext(Job job) {
    return new JobContextImpl(job.getConfiguration(), job.getJobID());
}
/**
 * Get the timestamps of the files. Used by internal
 * DistributedCache and MapReduce code.
 * @return a string array of timestamps
 */
public String[] getFileTimestamps() {
    return toTimestampStrs(DistributedCache.getFileTimestamps(conf));
}
@Override
public BaseStatistics getStatistics(BaseStatistics cachedStats) throws IOException {
    // only gather base statistics for FileInputFormats
    if (!(mapreduceInputFormat instanceof FileInputFormat)) {
        return null;
    }

    JobContext jobContext = new JobContextImpl(configuration, null);

    final FileBaseStatistics cachedFileStats = (cachedStats instanceof FileBaseStatistics)
        ? (FileBaseStatistics) cachedStats
        : null;

    try {
        final org.apache.hadoop.fs.Path[] paths = FileInputFormat.getInputPaths(jobContext);
        return getFileStats(cachedFileStats, paths, new ArrayList<FileStatus>(1));
    } catch (IOException ioex) {
        if (LOG.isWarnEnabled()) {
            LOG.warn("Could not determine statistics due to an io error: " + ioex.getMessage());
        }
    } catch (Throwable t) {
        if (LOG.isErrorEnabled()) {
            LOG.error("Unexpected problem while getting the file statistics: " + t.getMessage(), t);
        }
    }

    // no statistics available
    return null;
}
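A hedged usage sketch for getStatistics: callers pass the previously cached statistics, or null on the first call, and must handle a null result, which signals either a non-file input format or a failure while reading file metadata. The `format` variable is an illustrative assumption:

// Hypothetical caller: `format` is an instance of the class defining getStatistics above.
BaseStatistics stats = format.getStatistics(null); // no cached statistics on first call
if (stats != null) {
    System.out.println("Total input size: " + stats.getTotalInputSize() + " bytes");
}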
@Override
public HadoopInputSplit[] createInputSplits(int minNumSplits) throws IOException {
    configuration.setInt("mapreduce.input.fileinputformat.split.minsize", minNumSplits);

    JobContext jobContext = new JobContextImpl(configuration, new JobID());

    List<InputSplit> splits;
    try {
        splits = this.hCatInputFormat.getSplits(jobContext);
    } catch (InterruptedException e) {
        throw new IOException("Could not get Splits.", e);
    }

    HadoopInputSplit[] hadoopInputSplits = new HadoopInputSplit[splits.size()];
    for (int i = 0; i < hadoopInputSplits.length; i++) {
        hadoopInputSplits[i] = new HadoopInputSplit(i, splits.get(i), jobContext);
    }
    return hadoopInputSplits;
}
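For context on the first line of the method above: inside Hadoop's FileInputFormat, the configured minimum split size participates in the split size computation roughly as follows (paraphrased from Hadoop's FileInputFormat.computeSplitSize):

// Paraphrase of Hadoop's FileInputFormat.computeSplitSize: the min-size value
// set in createInputSplits above acts as a lower bound on each split's size.
protected long computeSplitSize(long blockSize, long minSize, long maxSize) {
    return Math.max(minSize, Math.min(maxSize, blockSize));
}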
@Override
public HadoopInputSplit[] createInputSplits(int minNumSplits) throws IOException {
    configuration.setInt("mapreduce.input.fileinputformat.split.minsize", minNumSplits);

    JobContext jobContext = new JobContextImpl(configuration, new JobID());
    jobContext.getCredentials().addAll(this.credentials);
    Credentials currentUserCreds = getCredentialsFromUGI(UserGroupInformation.getCurrentUser());
    if (currentUserCreds != null) {
        jobContext.getCredentials().addAll(currentUserCreds);
    }

    List<org.apache.hadoop.mapreduce.InputSplit> splits;
    try {
        splits = this.mapreduceInputFormat.getSplits(jobContext);
    } catch (InterruptedException e) {
        throw new IOException("Could not get Splits.", e);
    }

    HadoopInputSplit[] hadoopInputSplits = new HadoopInputSplit[splits.size()];
    for (int i = 0; i < hadoopInputSplits.length; i++) {
        hadoopInputSplits[i] = new HadoopInputSplit(i, splits.get(i), jobContext);
    }
    return hadoopInputSplits;
}
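The getCredentialsFromUGI helper used above is not part of this excerpt; given the null check at its call sites, a plausible sketch is a reflective lookup that tolerates Hadoop versions where UserGroupInformation has no getCredentials method (requires java.lang.reflect.Method):

// Hedged sketch of the getCredentialsFromUGI helper (assumed implementation):
// fetch UGI credentials reflectively so the code also loads on Hadoop versions
// where UserGroupInformation#getCredentials does not exist; returns null then,
// which is why callers null-check the result before merging.
public static Credentials getCredentialsFromUGI(UserGroupInformation ugi) {
    try {
        Method getCredentials = ugi.getClass().getMethod("getCredentials");
        return (Credentials) getCredentials.invoke(ugi);
    } catch (NoSuchMethodException e) {
        return null; // Hadoop version without UGI credential support
    } catch (ReflectiveOperationException e) {
        throw new RuntimeException("Unable to read credentials from UGI.", e);
    }
}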
try {
    this.context = new TaskAttemptContextImpl(this.configuration, taskAttemptID);
    this.outputCommitter = this.mapreduceOutputFormat.getOutputCommitter(this.context);
    this.outputCommitter.setupJob(new JobContextImpl(this.configuration, new JobID()));
} catch (Exception e) {
    throw new RuntimeException(e);
}
@Override
public void finalizeGlobal(int parallelism) throws IOException {
    JobContext jobContext;
    TaskAttemptContext taskContext;
    try {
        // Builds the fixed attempt ID "attempt__0000_r_000001_0" by zero-padding
        // the task number to six digits.
        TaskAttemptID taskAttemptID = TaskAttemptID.forName("attempt__0000_r_"
            + String.format("%" + (6 - Integer.toString(1).length()) + "s", " ").replace(" ", "0")
            + Integer.toString(1) + "_0");

        jobContext = new JobContextImpl(this.configuration, new JobID());
        taskContext = new TaskAttemptContextImpl(this.configuration, taskAttemptID);
        this.outputCommitter = this.mapreduceOutputFormat.getOutputCommitter(taskContext);
    } catch (Exception e) {
        throw new RuntimeException(e);
    }

    jobContext.getCredentials().addAll(this.credentials);
    Credentials currentUserCreds = getCredentialsFromUGI(UserGroupInformation.getCurrentUser());
    if (currentUserCreds != null) {
        jobContext.getCredentials().addAll(currentUserCreds);
    }

    // finalize HDFS output format
    if (this.outputCommitter != null) {
        this.outputCommitter.commitJob(jobContext);
    }
}
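The padded-string construction of the TaskAttemptID above is equivalent to a single format call; a quick illustrative check (this simplification is mine, not from the source):

// Equivalent, simpler construction of the same attempt ID (my simplification):
String attempt = String.format("attempt__0000_r_%06d_0", 1);
// attempt == "attempt__0000_r_000001_0", matching the concatenation in finalizeGlobal
TaskAttemptID sameId = TaskAttemptID.forName(attempt);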