/**
 * Adds the given cluster to this object's cluster collection.
 * <p>
 * The cluster is accepted only when its point count equals the number of
 * expected field names declared by the model schema. On acceptance it is
 * assigned an ordinal equal to the current cluster count plus one, and is then
 * appended to {@code clusters}.
 *
 * @param cluster the cluster to add
 * @throws IllegalArgumentException if the cluster's point count differs from
 *                                  the number of expected field names
 */
public void addCluster( Cluster cluster ) {
  int expectedFieldCount = getModelSchema().getExpectedFieldNames().size();
  boolean sizesMatch = expectedFieldCount == cluster.getPointsSize();

  if( !sizesMatch ) {
    throw new IllegalArgumentException( "given points must be same size as active fields" );
  }

  // ordinal is derived from the count before this cluster is appended
  int nextOrdinal = getClusters().size() + 1;

  cluster.setOrdinal( nextOrdinal );
  this.clusters.add( cluster );
}
public ClusterEvaluator[] getClusterEvaluator( Fields argumentFields ) { List<Cluster> sorted = new ArrayList<Cluster>( clusters ); final DataField predictedField = getModelSchema().getPredictedField( getModelSchema().getPredictedFieldNames().get( 0 ) ); // order tables in category order as this is the declared field name order if( predictedField instanceof CategoricalDataField ) { Ordering<Cluster> ordering = Ordering.natural().onResultOf( new Function<Cluster, Comparable>() { @Override public Comparable apply( Cluster cluster ) { return ( (CategoricalDataField) predictedField ).getCategories().indexOf( cluster.getTargetCategory() ); } } ); Collections.sort( sorted, ordering ); } ClusterEvaluator[] clusterEvaluators = new ClusterEvaluator[ sorted.size() ]; for( int i = 0; i < sorted.size(); i++ ) clusterEvaluators[ i ] = new ClusterEvaluator( argumentFields, sorted.get( i ), getComparisonMeasure(), getDefaultCompareFunction() ); return clusterEvaluators; }
@Override public void operate( FlowProcess flowProcess, FunctionCall<Context<EvaluatorContext>> functionCall ) { ClusterEvaluator[] evaluators = functionCall.getContext().payload.evaluators; double[] results = functionCall.getContext().payload.results; for( int i = 0; i < evaluators.length; i++ ) results[ i ] = evaluators[ i ].evaluate( functionCall.getArguments() ); LOG.debug( "results: {}", results ); // calc min distance double min = Doubles.min( results ); int index = Doubles.indexOf( results, min ); String category = evaluators[ index ].getTargetCategory(); LOG.debug( "category: {}", category ); // emit distance, and intermediate cluster category scores if( !getSpec().getModelSchema().isIncludePredictedCategories() ) { functionCall.getOutputCollector().add( functionCall.getContext().result( category ) ); return; } Tuple result = functionCall.getContext().tuple; result.set( 0, category ); for( int i = 0; i < results.length; i++ ) result.set( i + 1, results[ i ] ); functionCall.getOutputCollector().add( result ); } }