// Log progress, then register on mergeVx a data source named after mapWork, built from a MultiMRInput config builder for HiveInputFormat.
LOG.info("Going through each work and adding MultiMRInput"); mergeVx.addDataSource(mapWork.getName(), MultiMRInput.createConfigBuilder(conf, HiveInputFormat.class).build());
MultiMRInput.createConfigBuilder(conf, inputFormatClass).groupSplits(false).build(); } else { dataSource =
MultiMRInput.createConfigBuilder(conf, inputFormatClass).groupSplits(false).build(); } else { dataSource =
// Log progress, then register on mergeVx a data source named after mapWork, built from a MultiMRInput config builder for HiveInputFormat.
LOG.info("Going through each work and adding MultiMRInput"); mergeVx.addDataSource(mapWork.getName(), MultiMRInput.createConfigBuilder(conf, HiveInputFormat.class).build());
/**
 * Creates a {@link MultiMRInputConfigBuilder} for configuring a {@link MultiMRInput}.
 *
 * <p>The preferred usage model is to supply all of the parameters here and then use the
 * builder's methods to configure the Input.
 *
 * <p>Legacy applications that already hold a fully configured
 * {@link org.apache.hadoop.conf.Configuration} instance may pass {@code null} as the
 * inputFormat.
 *
 * <p>Typically this is used together with a custom
 * {@link org.apache.tez.dag.api.VertexManagerPlugin} or
 * {@link org.apache.tez.runtime.api.InputInitializer} that generates the multiple inputs to be
 * used by each task. If neither is set up, this works the same as
 * {@link org.apache.tez.mapreduce.input.MRInput}.
 *
 * <p>Grouping of splits is disabled by default.
 *
 * @param conf        Configuration for the {@link MultiMRInput}. This configuration instance
 *                    will be modified in place
 * @param inputFormat InputFormat derived class. This can be null; if it is null, the provided
 *                    configuration should be complete.
 * @return {@link MultiMRInputConfigBuilder}
 */
public static MultiMRInputConfigBuilder createConfigBuilder(Configuration conf,
    @Nullable Class<?> inputFormat) {
  final MultiMRInputConfigBuilder builder = new MultiMRInputConfigBuilder(conf, inputFormat);
  final String inputClassName = MultiMRInput.class.getName();
  // Bind the builder to MultiMRInput and turn split grouping off up front.
  builder.setInputClassName(inputClassName).groupSplits(false);
  return builder;
}
MultiMRInput.createConfigBuilder(conf, inputFormatClass).groupSplits(false).build(); } else { dataSource =
// Log progress, then register on mergeVx a data source named after mapWork, built from a MultiMRInput config builder for HiveInputFormat.
LOG.info("Going through each work and adding MultiMRInput"); mergeVx.addDataSource(mapWork.getName(), MultiMRInput.createConfigBuilder(conf, HiveInputFormat.class).build());