public void configure(JobConf conf) {
  this.conf = conf;
  this.isMapOnly = conf.getNumReduceTasks() == 0;
}
@Override
@SuppressWarnings("unchecked")
public void configure(JobConf conf) {
  this.mapper = ReflectionUtils.newInstance(
      conf.getClass(AvroJob.MAPPER, AvroMapper.class, AvroMapper.class), conf);
  this.isMapOnly = conf.getNumReduceTasks() == 0;
}
/**
 * Ensures that the given number of reduce tasks for the given job
 * configuration does not exceed the number of regions for the given table.
 *
 * @param table The table to get the region count for.
 * @param job The current job configuration to adjust.
 * @throws IOException When retrieving the table details fails.
 */
// Used by tests.
public static void limitNumReduceTasks(String table, JobConf job) throws IOException {
  int regions = MetaTableAccessor.getRegionCount(HBaseConfiguration.create(job),
      TableName.valueOf(table));
  if (job.getNumReduceTasks() > regions) {
    job.setNumReduceTasks(regions);
  }
}
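A minimal usage sketch (the table name and reducer count are illustrative, and the job is assumed to be otherwise fully configured): the cap is applied after the desired reducer count is set and before submission, so no reducer is left without a region to write to.

JobConf job = new JobConf(HBaseConfiguration.create());
job.setNumReduceTasks(32);                               // requested parallelism
TableMapReduceUtil.limitNumReduceTasks("myTable", job);  // clamped to the table's region count if smaller
JobClient.runJob(job);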
public void writePartitionKeys(Path path, JobConf job) throws IOException {
  byte[][] partitionKeys = getPartitionKeys(job.getNumReduceTasks());
  int numPartition = partitionKeys.length + 1;
  if (numPartition != job.getNumReduceTasks()) {
    job.setNumReduceTasks(numPartition);
  }
  FileSystem fs = path.getFileSystem(job);
  SequenceFile.Writer writer = SequenceFile.createWriter(fs, job, path,
      BytesWritable.class, NullWritable.class);
  try {
    for (byte[] pkey : partitionKeys) {
      BytesWritable wrapper = new BytesWritable(pkey);
      writer.append(wrapper, NullWritable.get());
    }
  } finally {
    IOUtils.closeStream(writer);
  }
}
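The "+ 1" above follows from how split points define ranges: n keys cut the sorted key space into n + 1 partitions, so the reducer count is forced to match. A sketch with hypothetical split points:

// 3 split points yield 4 ranges:
//   (-inf, "g")  ["g", "n")  ["n", "u")  ["u", +inf)
byte[][] keys = {
    "g".getBytes(StandardCharsets.UTF_8),
    "n".getBytes(StandardCharsets.UTF_8),
    "u".getBytes(StandardCharsets.UTF_8),
};
job.setNumReduceTasks(keys.length + 1);  // 4 reducers, one per range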
/**
 * Adds a named output for the job.
 *
 * @param conf job conf to add the named output to
 * @param namedOutput named output name; it has to be a word made of letters
 *                    and numbers only, and cannot be the word 'part', as
 *                    that is reserved for the default output.
 * @param multi indicates if the named output is multi
 * @param outputFormatClass OutputFormat class.
 * @param schema Schema to be used for this named output
 */
private static void addNamedOutput(JobConf conf, String namedOutput,
    boolean multi, Class<? extends OutputFormat> outputFormatClass,
    Schema schema) {
  checkNamedOutputName(namedOutput);
  checkNamedOutput(conf, namedOutput, true);
  boolean isMapOnly = conf.getNumReduceTasks() == 0;
  if (schema != null) {
    conf.set(MO_PREFIX + namedOutput + ".schema", schema.toString());
  }
  conf.set(NAMED_OUTPUTS, conf.get(NAMED_OUTPUTS, "") + " " + namedOutput);
  conf.setClass(MO_PREFIX + namedOutput + FORMAT, outputFormatClass,
      OutputFormat.class);
  conf.setBoolean(MO_PREFIX + namedOutput + MULTI, multi);
}
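A hedged caller sketch (the output name and schema are illustrative; in Avro's multiple-outputs API this private helper is reached through the public addNamedOutput/addMultiNamedOutput overloads):

Schema schema = Schema.create(Schema.Type.STRING);
addNamedOutput(conf, "avro1", false, AvroOutputFormat.class, schema);
// After the call, "avro1" is appended to the NAMED_OUTPUTS list and its
// schema, OutputFormat class, and multi flag sit under the MO_PREFIX keys.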
int regions = MetaTableAccessor.getRegionCount(HBaseConfiguration.create(job),
    TableName.valueOf(table));
if (job.getNumReduceTasks() > regions) {
  job.setNumReduceTasks(regions);
}
@SuppressWarnings({"unchecked", "deprecation"}) public RecordWriter<Object, Object> getRecordWriter(FileSystem fs,JobConf job, String baseFileName, Progressable arg3) throws IOException { String nameOutput = job.get(CONFIG_NAMED_OUTPUT, null); String fileName = getUniqueName(job, baseFileName); Schema schema = null; String schemastr = job.get(MO_PREFIX+nameOutput+".schema",null); if (schemastr!=null) schema = Schema.parse(schemastr); JobConf outputConf = new JobConf(job); outputConf.setOutputFormat(getNamedOutputFormatClass(job, nameOutput)); boolean isMapOnly = job.getNumReduceTasks() == 0; if (schema != null) { if (isMapOnly) AvroJob.setMapOutputSchema(outputConf, schema); else AvroJob.setOutputSchema(outputConf, schema); } OutputFormat outputFormat = outputConf.getOutputFormat(); return outputFormat.getRecordWriter(fs, outputConf, fileName, arg3); } }
    throws IOException {
  boolean isMapOnly = job.getNumReduceTasks() == 0;
  final Schema schema = isMapOnly
      ? AvroJob.getMapOutputSchema(job)
      : AvroJob.getOutputSchema(job);
@Override
public RecordWriter<AvroWrapper<T>, NullWritable> getRecordWriter(
    FileSystem ignore, JobConf job, String name, Progressable prog)
    throws IOException {
  boolean isMapOnly = job.getNumReduceTasks() == 0;
  Schema schema = isMapOnly
      ? AvroJob.getMapOutputSchema(job)
      : AvroJob.getOutputSchema(job);
  GenericData dataModel = AvroJob.createDataModel(job);
  final DataFileWriter<T> writer =
      new DataFileWriter<T>(dataModel.createDatumWriter(null));
  configureDataFileWriter(writer, job);
  Path path = FileOutputFormat.getTaskOutputPath(job, name + EXT);
  writer.create(schema, path.getFileSystem(job).create(path));
  return new RecordWriter<AvroWrapper<T>, NullWritable>() {
    public void write(AvroWrapper<T> wrapper, NullWritable ignore)
        throws IOException {
      writer.append(wrapper.datum());
    }

    public void close(Reporter reporter) throws IOException {
      writer.close();
    }
  };
}
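A sketch of the two job setups the writer distinguishes (the reducer counts and the string schema are illustrative): a map-only job carries its schema in the map-output slot, a job with reducers in the final-output slot.

JobConf mapOnly = new JobConf();
mapOnly.setNumReduceTasks(0);       // map-only: AvroJob.getMapOutputSchema(job) is consulted
AvroJob.setMapOutputSchema(mapOnly, Schema.create(Schema.Type.STRING));

JobConf withReducers = new JobConf();
withReducers.setNumReduceTasks(4);  // reducers present: AvroJob.getOutputSchema(job) is consulted
AvroJob.setOutputSchema(withReducers, Schema.create(Schema.Type.STRING));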
process.inputClient.partitions(job.getNumReduceTasks());
    || jobConf.get(MRJobConfig.COMBINE_CLASS_ATTR) != null;
int numReduces = jobConf.getNumReduceTasks();
boolean isMapOnly = ((JobConf) getConf()).getNumReduceTasks() == 0;
if (AvroKey.class.isAssignableFrom(inputClass)) {
  Schema schema;
/**
 * Checks that the given number of reduce tasks for the given job configuration
 * does not exceed the number of regions for the given table.
 */
@Test
public void shouldNumberOfReduceTaskNotExceedNumberOfRegionsForGivenTable()
    throws IOException {
  Assert.assertNotNull(presidentsTable);
  Configuration cfg = UTIL.getConfiguration();
  JobConf jobConf = new JobConf(cfg);
  TableMapReduceUtil.setNumReduceTasks(TABLE_NAME, jobConf);
  TableMapReduceUtil.limitNumReduceTasks(TABLE_NAME, jobConf);
  TableMapReduceUtil.setScannerCaching(jobConf, 100);
  assertEquals(1, jobConf.getNumReduceTasks());
  assertEquals(100, jobConf.getInt("hbase.client.scanner.caching", 0));

  jobConf.setNumReduceTasks(10);
  TableMapReduceUtil.setNumMapTasks(TABLE_NAME, jobConf);
  TableMapReduceUtil.limitNumReduceTasks(TABLE_NAME, jobConf);
  assertEquals(1, jobConf.getNumReduceTasks());
}
public void configure(JobConf job) {
  number_nodes = Long.parseLong(job.get("number_nodes"));
  //nreducers = Integer.parseInt(job.get("nreducers"));
  nreducers = job.getNumReduceTasks();
  System.out.println("MapHistogram configure(): number_nodes = " + number_nodes
      + ", nreducers=" + nreducers);
}
if (mWork.getSamplingType() > 0 && rWork != null && job.getNumReduceTasks() > 1) {
  try {
    handleSampling(ctx, mWork, job);
console.printInfo("Number of reduce tasks determined at compile time: " + rWork.getNumReduceTasks()); } else if (job.getNumReduceTasks() > 0) { int reducers = job.getNumReduceTasks(); rWork.setNumReduceTasks(reducers); console
console.printInfo("Number of reduce tasks determined at compile time: " + rWork.getNumReduceTasks()); } else if (job.getNumReduceTasks() > 0) { int reducers = job.getNumReduceTasks(); rWork.setNumReduceTasks(reducers); console
@Test @SuppressWarnings({ "deprecation" }) public void shouldCreateAndRunSubmittableJob() throws Exception { RowCounter rCounter = new RowCounter(); rCounter.setConf(HBaseConfiguration.create()); String[] args = new String[] { "\temp", "tableA", "column1", "column2", "column3" }; JobConf jobConfig = rCounter.createSubmittableJob(args); assertNotNull(jobConfig); assertEquals(0, jobConfig.getNumReduceTasks()); assertEquals("rowcounter", jobConfig.getJobName()); assertEquals(jobConfig.getMapOutputValueClass(), Result.class); assertEquals(jobConfig.getMapperClass(), RowCounterMapper.class); assertEquals(jobConfig.get(TableInputFormat.COLUMN_LIST), Joiner.on(' ') .join("column1", "column2", "column3")); assertEquals(jobConfig.getMapOutputKeyClass(), ImmutableBytesWritable.class); }