/**
 * Command-line entry point: creates a {@code DatasetSplitter} and passes it,
 * together with the raw arguments, to {@code ToolRunner.run}.
 *
 * <p>Whatever {@code ToolRunner.run} returns is not used here.
 *
 * @param args command-line arguments, forwarded unchanged
 * @throws Exception propagated from {@code ToolRunner.run}
 */
public static void main(String[] args) throws Exception {
  DatasetSplitter splitter = new DatasetSplitter();
  ToolRunner.run(splitter, args);
}
// Body fragment of the job driver (the enclosing method header is not visible here).
// Steps performed by the statements below, in order:
//   1. Registers the input and output options, plus "trainingPercentage" (-t) and
//      "probePercentage" (-p), each defaulting to its DEFAULT_* constant.
//   2. Parses the arguments; returns -1 when parseArguments(args) yields null.
//   3. Reads both percentages as doubles and reads the "tempDir" option.
//   4. Derives the "trainingSet" and "probeSet" paths under getOutputPath().
//   5. Prepares three jobs: markPreferences (text input -> markedPrefs via
//      MarkPreferencesMapper, with TRAINING_PERCENTAGE set on its configuration),
//      then createTrainingSet and createProbeSet, which both read markedPrefs with
//      WritePrefsMapper and differ only in the PART_TO_USE value and output path.
// NOTE(review): this fragment looks truncated - the `if (parsedArgs == null) {` brace is
// never closed, `markedPrefs` is used without a visible declaration, `probePercentage`
// and `tempDir` are read but not used afterwards, and none of the prepared jobs is
// started in the visible text. Confirm against the complete file.
addInputOption(); addOutputOption(); addOption("trainingPercentage", "t", "percentage of the data to use as training set (default: " + DEFAULT_TRAINING_PERCENTAGE + ')', String.valueOf(DEFAULT_TRAINING_PERCENTAGE)); addOption("probePercentage", "p", "percentage of the data to use as probe set (default: " + DEFAULT_PROBE_PERCENTAGE + ')', String.valueOf(DEFAULT_PROBE_PERCENTAGE)); Map<String,List<String>> parsedArgs = parseArguments(args); if (parsedArgs == null) { return -1; double trainingPercentage = Double.parseDouble(getOption("trainingPercentage")); double probePercentage = Double.parseDouble(getOption("probePercentage")); String tempDir = getOption("tempDir"); Path trainingSetPath = new Path(getOutputPath(), "trainingSet"); Path probeSetPath = new Path(getOutputPath(), "probeSet"); Job markPreferences = prepareJob(getInputPath(), markedPrefs, TextInputFormat.class, MarkPreferencesMapper.class, Text.class, Text.class, SequenceFileOutputFormat.class); markPreferences.getConfiguration().set(TRAINING_PERCENTAGE, String.valueOf(trainingPercentage)); Job createTrainingSet = prepareJob(markedPrefs, trainingSetPath, SequenceFileInputFormat.class, WritePrefsMapper.class, NullWritable.class, Text.class, TextOutputFormat.class); createTrainingSet.getConfiguration().set(PART_TO_USE, INTO_TRAINING_SET.toString()); Job createProbeSet = prepareJob(markedPrefs, probeSetPath, SequenceFileInputFormat.class, WritePrefsMapper.class, NullWritable.class, Text.class, TextOutputFormat.class); createProbeSet.getConfiguration().set(PART_TO_USE, INTO_PROBE_SET.toString());
// Body fragment of the job driver (the enclosing method header is not visible here).
// Steps performed by the statements below, in order:
//   1. Registers the input and output options, plus "trainingPercentage" (-t) and
//      "probePercentage" (-p), each defaulting to its DEFAULT_* constant.
//   2. Parses the arguments; returns -1 when parseArguments(args) yields null.
//   3. Reads both percentages as doubles and reads the "tempDir" option.
//   4. Derives the "trainingSet" and "probeSet" paths under getOutputPath().
//   5. Prepares three jobs: markPreferences (text input -> markedPrefs via
//      MarkPreferencesMapper, with TRAINING_PERCENTAGE set on its configuration),
//      then createTrainingSet and createProbeSet, which both read markedPrefs with
//      WritePrefsMapper and differ only in the PART_TO_USE value and output path.
// NOTE(review): this fragment looks truncated - the `if (parsedArgs == null) {` brace is
// never closed, `markedPrefs` is used without a visible declaration, `probePercentage`
// and `tempDir` are read but not used afterwards, and none of the prepared jobs is
// started in the visible text. Confirm against the complete file.
addInputOption(); addOutputOption(); addOption("trainingPercentage", "t", "percentage of the data to use as training set (default: " + DEFAULT_TRAINING_PERCENTAGE + ')', String.valueOf(DEFAULT_TRAINING_PERCENTAGE)); addOption("probePercentage", "p", "percentage of the data to use as probe set (default: " + DEFAULT_PROBE_PERCENTAGE + ')', String.valueOf(DEFAULT_PROBE_PERCENTAGE)); Map<String,List<String>> parsedArgs = parseArguments(args); if (parsedArgs == null) { return -1; double trainingPercentage = Double.parseDouble(getOption("trainingPercentage")); double probePercentage = Double.parseDouble(getOption("probePercentage")); String tempDir = getOption("tempDir"); Path trainingSetPath = new Path(getOutputPath(), "trainingSet"); Path probeSetPath = new Path(getOutputPath(), "probeSet"); Job markPreferences = prepareJob(getInputPath(), markedPrefs, TextInputFormat.class, MarkPreferencesMapper.class, Text.class, Text.class, SequenceFileOutputFormat.class); markPreferences.getConfiguration().set(TRAINING_PERCENTAGE, String.valueOf(trainingPercentage)); Job createTrainingSet = prepareJob(markedPrefs, trainingSetPath, SequenceFileInputFormat.class, WritePrefsMapper.class, NullWritable.class, Text.class, TextOutputFormat.class); createTrainingSet.getConfiguration().set(PART_TO_USE, INTO_TRAINING_SET.toString()); Job createProbeSet = prepareJob(markedPrefs, probeSetPath, SequenceFileInputFormat.class, WritePrefsMapper.class, NullWritable.class, Text.class, TextOutputFormat.class); createProbeSet.getConfiguration().set(PART_TO_USE, INTO_PROBE_SET.toString());
// Body fragment of the job driver (the enclosing method header is not visible here).
// Steps performed by the statements below, in order:
//   1. Registers the input and output options, plus "trainingPercentage" (-t) and
//      "probePercentage" (-p), each defaulting to its DEFAULT_* constant.
//   2. Parses the arguments; returns -1 when parseArguments(args) yields null.
//   3. Reads both percentages as doubles and reads the "tempDir" option.
//   4. Derives the "trainingSet" and "probeSet" paths under getOutputPath().
//   5. Prepares three jobs: markPreferences (text input -> markedPrefs via
//      MarkPreferencesMapper, with TRAINING_PERCENTAGE set on its configuration),
//      then createTrainingSet and createProbeSet, which both read markedPrefs with
//      WritePrefsMapper and differ only in the PART_TO_USE value and output path.
// NOTE(review): this fragment looks truncated - the `if (parsedArgs == null) {` brace is
// never closed, `markedPrefs` is used without a visible declaration, `probePercentage`
// and `tempDir` are read but not used afterwards, and none of the prepared jobs is
// started in the visible text. Confirm against the complete file.
addInputOption(); addOutputOption(); addOption("trainingPercentage", "t", "percentage of the data to use as training set (default: " + DEFAULT_TRAINING_PERCENTAGE + ')', String.valueOf(DEFAULT_TRAINING_PERCENTAGE)); addOption("probePercentage", "p", "percentage of the data to use as probe set (default: " + DEFAULT_PROBE_PERCENTAGE + ')', String.valueOf(DEFAULT_PROBE_PERCENTAGE)); Map<String,List<String>> parsedArgs = parseArguments(args); if (parsedArgs == null) { return -1; double trainingPercentage = Double.parseDouble(getOption("trainingPercentage")); double probePercentage = Double.parseDouble(getOption("probePercentage")); String tempDir = getOption("tempDir"); Path trainingSetPath = new Path(getOutputPath(), "trainingSet"); Path probeSetPath = new Path(getOutputPath(), "probeSet"); Job markPreferences = prepareJob(getInputPath(), markedPrefs, TextInputFormat.class, MarkPreferencesMapper.class, Text.class, Text.class, SequenceFileOutputFormat.class); markPreferences.getConfiguration().set(TRAINING_PERCENTAGE, String.valueOf(trainingPercentage)); Job createTrainingSet = prepareJob(markedPrefs, trainingSetPath, SequenceFileInputFormat.class, WritePrefsMapper.class, NullWritable.class, Text.class, TextOutputFormat.class); createTrainingSet.getConfiguration().set(PART_TO_USE, INTO_TRAINING_SET.toString()); Job createProbeSet = prepareJob(markedPrefs, probeSetPath, SequenceFileInputFormat.class, WritePrefsMapper.class, NullWritable.class, Text.class, TextOutputFormat.class); createProbeSet.getConfiguration().set(PART_TO_USE, INTO_PROBE_SET.toString());
/**
 * Command-line entry point: creates a {@code DatasetSplitter} and passes it,
 * together with the raw arguments, to {@code ToolRunner.run}.
 *
 * <p>Whatever {@code ToolRunner.run} returns is not used here.
 *
 * @param args command-line arguments, forwarded unchanged
 * @throws Exception propagated from {@code ToolRunner.run}
 */
public static void main(String[] args) throws Exception {
  DatasetSplitter splitter = new DatasetSplitter();
  ToolRunner.run(splitter, args);
}
/**
 * Command-line entry point: creates a {@code DatasetSplitter} and passes it,
 * together with the raw arguments, to {@code ToolRunner.run}.
 *
 * <p>Whatever {@code ToolRunner.run} returns is not used here.
 *
 * @param args command-line arguments, forwarded unchanged
 * @throws Exception propagated from {@code ToolRunner.run}
 */
public static void main(String[] args) throws Exception {
  DatasetSplitter splitter = new DatasetSplitter();
  ToolRunner.run(splitter, args);
}