/**
 * Asks every configuration in the population whether it considers the
 * two identified records a match.
 *
 * <p>Each record is looked up in {@code database} first; when that
 * returns {@code null} the lookup falls back to {@code secondary}.
 *
 * @param id1 identifier of the first record
 * @param id2 identifier of the second record
 * @return one flag per configuration, in the order returned by
 *         {@code population.getConfigs()}; a flag is {@code true} when
 *         that configuration's comparison result for the pair is
 *         strictly greater than its own threshold
 */
private boolean[] whoThinksThisIsTrue(String id1, String id2) {
  Record first = database.findRecordById(id1);
  if (first == null) {
    first = secondary.get(id1);
  }

  Record second = database.findRecordById(id2);
  if (second == null) {
    second = secondary.get(id2);
  }

  List<GeneticConfiguration> candidates = population.getConfigs();
  boolean[] votes = new boolean[candidates.size()];
  int slot = 0;
  for (GeneticConfiguration candidate : candidates) {
    Configuration cfg = candidate.getConfiguration();
    // a fresh processor per candidate, since each one carries its own configuration
    Processor judge = new Processor(cfg, database);
    votes[slot++] = judge.compare(first, second) > cfg.getThreshold();
  }
  return votes;
}
} // closes an enclosing scope opened outside this snippet
/**
 * Indexes the configured data sources into the given database through a
 * newly created {@code Processor}, after announcing the reindex on
 * standard output.
 *
 * <p>In deduplication mode the single set of data sources is indexed;
 * otherwise data-source groups 1 and 2 are indexed, in that order.
 *
 * @param config   configuration supplying the mode and the data sources
 * @param database database handed to the processor
 */
private static void reindex(Configuration config, Database database) {
  System.out.println("Reindexing all records...");
  Processor indexer = new Processor(config, database);

  if (!config.isDeduplicationMode()) {
    // not deduplicating: two groups of sources, indexed one after the other
    indexer.index(config.getDataSources(1), DEFAULT_BATCH_SIZE);
    indexer.index(config.getDataSources(2), DEFAULT_BATCH_SIZE);
    return;
  }

  indexer.index(config.getDataSources(), DEFAULT_BATCH_SIZE);
}
} // closes an enclosing scope opened outside this snippet
/**
 * Builds the fixture shared by the tests: a configuration with the
 * properties ID, NAME and EMAIL, a match threshold of 0.85 and a
 * maybe-threshold of 0.8, plus a processor with a
 * {@code TestUtils.TestListener} registered as match listener.
 *
 * <p>NAME and EMAIL share one {@code Levenshtein} comparator and are
 * created with the numeric arguments 0.3 and 0.8 (presumably the low and
 * high probabilities for the property; confirm against
 * {@code PropertyImpl}).
 *
 * @throws IOException declared by the original signature; which call
 *         raises it is not visible from this method alone
 */
@Before
public void setup() throws IOException {
  listener = new TestUtils.TestListener();

  Levenshtein comp = new Levenshtein();
  // parameterized instead of the raw ArrayList, which caused an unchecked-conversion warning
  List<Property> props = new ArrayList<Property>();
  props.add(new PropertyImpl("ID"));
  props.add(new PropertyImpl("NAME", comp, 0.3, 0.8));
  props.add(new PropertyImpl("EMAIL", comp, 0.3, 0.8));

  config = new ConfigurationImpl();
  config.setProperties(props);
  config.setThreshold(0.85);
  config.setMaybeThreshold(0.8);

  // NOTE(review): meaning of the boolean constructor argument is not visible here; confirm
  processor = new Processor(config, true);
  processor.addMatchListener(listener);
}
// Creates the processor from config, passing the negation of noreindex as
// the second constructor argument (presumably "reindex when not suppressed";
// confirm against Processor's constructor), then hands it the logger and
// the thread count.
Processor processor = new Processor(config, !noreindex); processor.setLogger(logger); processor.setThreads(threads);
MatchListener listener) { Configuration cconfig = config.getConfiguration(); Processor proc = new Processor(cconfig, database); TestFileListener eval = makeEval(cconfig, testdb, proc);
// Creates the processor with false as the second constructor argument
// (NOTE(review): its meaning is not visible here; confirm), builds the link
// database from props, and registers a LinkDatabaseMatchListener, built
// from the config and that link database, on the processor.
this.processor = new Processor(config, false); this.linkdb = makeLinkDatabase(props); processor.addMatchListener(new LinkDatabaseMatchListener(config, linkdb));
/**
 * Prints a notice to standard output and then indexes the configured
 * data sources using a new {@code Processor} built from the given
 * configuration and database.
 *
 * <p>When the configuration is in deduplication mode, the data sources
 * returned by {@code getDataSources()} are indexed. In any other mode
 * the sources of group 1 are indexed first, followed by those of group 2.
 *
 * @param config   configuration that decides the mode and provides the sources
 * @param database database passed to the processor's constructor
 */
private static void reindex(Configuration config, Database database) {
  System.out.println("Reindexing all records...");
  Processor indexer = new Processor(config, database);

  boolean deduplicating = config.isDeduplicationMode();
  if (deduplicating) {
    indexer.index(config.getDataSources(), DEFAULT_BATCH_SIZE);
    return;
  }

  // two source groups: index each in turn
  indexer.index(config.getDataSources(1), DEFAULT_BATCH_SIZE);
  indexer.index(config.getDataSources(2), DEFAULT_BATCH_SIZE);
}
} // closes an enclosing scope opened outside this snippet
// Creates a Processor for cconfig over database, then passes it together
// with cconfig and testdb to makeEval, which returns the TestFileListener
// kept in eval.
Processor proc = new Processor(cconfig, database); TestFileListener eval = makeEval(cconfig, testdb, proc);
// Builds the processor from config; the second constructor argument is the
// negation of noreindex (presumably enables reindexing unless suppressed;
// confirm against Processor's constructor). The logger and the thread
// count are then set on it.
Processor processor = new Processor(config, !noreindex); processor.setLogger(logger); processor.setThreads(threads);
// Builds the processor (second constructor argument is false;
// NOTE(review): its meaning is not visible here, confirm), creates the link
// database from props, and attaches a LinkDatabaseMatchListener
// constructed with the config and that link database.
this.processor = new Processor(config, false); this.linkdb = makeLinkDatabase(props); processor.addMatchListener(new LinkDatabaseMatchListener(config, linkdb));