/**
 * Integration-style check of a 3x3 similarity matrix.
 *
 * <p>Visible setup: resolves a temp input file named "rows", temp directories named "output" and
 * "tmp" (calling {@code delete()} on the output directory handle right after obtaining it), and a
 * {@code FileSystem} for the input path.
 *
 * <p>Visible expectations: the matrix is non-null with 3 rows and 3 columns; entries (0,1) and
 * (1,0) are 0.5, entry (2,0) is 0.4, and every other entry, including the diagonal, is 0.0, each
 * compared within {@code EPSILON}. Note the expected values are not symmetric: (0,2) is 0.0 while
 * (2,0) is 0.4.
 *
 * <p>NOTE(review): {@code similarityMatrix} is asserted on but never declared in the visible
 * portion, and the method's closing brace is absent. The steps that write the input, run the job
 * and load the result appear to be missing from this excerpt; confirm against the full file.
 * NOTE(review): presumably the output directory is deleted so the job can create it itself;
 * verify.
 */
@Test public void toyIntegrationMaxSimilaritiesPerRow() throws Exception { File inputFile = getTestTempFile("rows"); File outputDir = getTestTempDir("output"); outputDir.delete(); File tmpDir = getTestTempDir("tmp"); Configuration conf = getConfiguration(); Path inputPath = new Path(inputFile.getAbsolutePath()); FileSystem fs = FileSystem.get(inputPath.toUri(), conf); assertNotNull(similarityMatrix); assertEquals(3, similarityMatrix.numCols()); assertEquals(3, similarityMatrix.numRows()); assertEquals(0.0, similarityMatrix.get(0, 0), EPSILON); assertEquals(0.5, similarityMatrix.get(0, 1), EPSILON); assertEquals(0.0, similarityMatrix.get(0, 2), EPSILON); assertEquals(0.5, similarityMatrix.get(1, 0), EPSILON); assertEquals(0.0, similarityMatrix.get(1, 1), EPSILON); assertEquals(0.0, similarityMatrix.get(1, 2), EPSILON); assertEquals(0.4, similarityMatrix.get(2, 0), EPSILON); assertEquals(0.0, similarityMatrix.get(2, 1), EPSILON); assertEquals(0.0, similarityMatrix.get(2, 2), EPSILON);
/**
 * Writes a 3-row, 6-column matrix to the temp "rows" file via
 * {@code MathHelper.writeDistributedRowMatrix} and checks that
 * {@code RowSimilarityJob.getDimensions} reports 6 for that path.
 *
 * @throws Exception if any of the setup or job calls fail
 */
@Test
public void testVectorDimensions() throws Exception {
  File rowsFile = getTestTempFile("rows");

  Configuration configuration = getConfiguration();
  Path rowsPath = new Path(rowsFile.getAbsolutePath());
  FileSystem fileSystem = FileSystem.get(rowsPath.toUri(), configuration);

  // Three rows, each with six entries; the expected dimension below is the row width.
  double[][] rows = {
      { 1, 0, 1, 1, 0, 1 },
      { 0, 1, 1, 1, 1, 1 },
      { 1, 1, 0, 1, 0, 0 }
  };
  MathHelper.writeDistributedRowMatrix(rows, fileSystem, configuration, rowsPath);

  RowSimilarityJob job = new RowSimilarityJob();
  job.setConf(configuration);

  int columnCount = job.getDimensions(rowsPath);
  assertEquals(6, columnCount);
}
}
File inputFile = getTestTempFile("rows"); File outputDir = getTestTempDir("output"); outputDir.delete(); File tmpDir = getTestTempDir("tmp"); Configuration conf = getConfiguration(); Path inputPath = new Path(inputFile.getAbsolutePath()); FileSystem fs = FileSystem.get(inputPath.toUri(), conf); assertNotNull(similarityMatrix); assertEquals(3, similarityMatrix.numCols()); assertEquals(3, similarityMatrix.numRows()); assertEquals(0.0, similarityMatrix.get(0, 0), EPSILON); assertEquals(0.5, similarityMatrix.get(0, 1), EPSILON); assertEquals(0.0, similarityMatrix.get(0, 2), EPSILON); assertEquals(0.5, similarityMatrix.get(1, 0), EPSILON); assertEquals(0.0, similarityMatrix.get(1, 1), EPSILON); assertEquals(0.0, similarityMatrix.get(1, 2), EPSILON); assertEquals(0.0, similarityMatrix.get(2, 0), EPSILON); assertEquals(0.0, similarityMatrix.get(2, 1), EPSILON); assertEquals(0.0, similarityMatrix.get(2, 2), EPSILON);
File inputFile = getTestTempFile("rows"); File outputDir = getTestTempDir("output"); outputDir.delete(); File tmpDir = getTestTempDir("tmp"); Configuration conf = getConfiguration(); Path inputPath = new Path(inputFile.getAbsolutePath()); FileSystem fs = FileSystem.get(inputPath.toUri(), conf); assertEquals(4, observationsPerColumn.size()); assertEquals(1, observationsPerColumn.get(0)); assertEquals(2, observationsPerColumn.get(2)); assertEquals(2, observationsPerColumn.get(3)); assertEquals(1, observationsPerColumn.get(4)); assertNotNull(similarityMatrix); assertEquals(3, similarityMatrix.numCols()); assertEquals(3, similarityMatrix.numRows()); assertEquals(1.0, similarityMatrix.get(0, 0), EPSILON); assertEquals(1.0, similarityMatrix.get(1, 1), EPSILON); assertEquals(1.0, similarityMatrix.get(2, 2), EPSILON); assertEquals(0.0, similarityMatrix.get(2, 0), EPSILON); assertEquals(0.0, similarityMatrix.get(2, 1), EPSILON); assertEquals(0.0, similarityMatrix.get(0, 2), EPSILON); assertEquals(0.0, similarityMatrix.get(1, 2), EPSILON); assertEquals(0.666666, similarityMatrix.get(0, 1), EPSILON); assertEquals(0.666666, similarityMatrix.get(1, 0), EPSILON);