@Override public void seal() { sealed = true; sortedStringList = new String[rawStringSet.size()]; rawStringSet.toArray(sortedStringList); Arrays.sort(sortedStringList); if (sortedStringList.length == 0) { min = null; max = null; return; } // Update min/max based on raw docs. min = sortedStringList[0]; max = sortedStringList[sortedStringList.length - 1]; // Merge the raw and aggregated docs, so stats for dictionary creation are collected correctly. int numAggregated = aggregatedStringSet.size(); if (numAggregated > 0) { rawStringSet.addAll(aggregatedStringSet); sortedStringList = new String[rawStringSet.size()]; rawStringSet.toArray(sortedStringList); Arrays.sort(sortedStringList); } } }
/**
 * Writes every indexed label, followed by the total number of labels, into
 * the given properties.
 *
 * <p>Each label is stored under the key
 * {@code genotype.segment.label.<index>}, and the entry count is stored under
 * {@code genotype.segment.label.numOfEntries}. All values are written as
 * strings.
 *
 * @param properties destination that receives the entries; modified in place
 */
public void writeMap(final Properties properties) {
    for (final Map.Entry<MutableString, Integer> labelEntry : indexedLabels.entrySet()) {
        final int index = labelEntry.getValue();
        final String label = labelEntry.getKey().toString();
        properties.put("genotype.segment.label." + index, label);
    }

    final int labelCount = indexedLabels.size();
    properties.put("genotype.segment.label.numOfEntries", Integer.toString(labelCount));
}
/**
 * Builds an assignment array with one slot per entry of {@code map.vectors}.
 *
 * <p>Every slot is first filled with a random value in
 * {@code [0, words.size())}. Then, for each word in list order, the slot at
 * index {@code order.get(word)} is overwritten with that word's position in
 * {@code words}.
 *
 * @param map   word vectors; only the number of entries in {@code map.vectors} is used
 * @param words words whose list positions are written into the result
 * @param order maps each word to the slot that receives its position
 * @return the assignment array, of length {@code map.vectors.entrySet().size()}
 */
public int[] originalAssignment( final UncompressedWordVectors map, ArrayList<String> words, Object2IntOpenHashMap<String> order ) {
    final int slotCount = map.vectors.entrySet().size();
    final int[] assignment = new int[ slotCount ];

    // Random pre-fill; slots named by `order` are overwritten below.
    final Random rng = new Random();
    int slot = 0;
    while( slot < slotCount ) {
        assignment[ slot ] = rng.nextInt( words.size() );
        slot++;
    }

    for( int position = 0; position < words.size(); position++ ) {
        final String word = words.get( position );
        assignment[ order.get( word ) ] = position;
    }
    return assignment;
}
SerializeExample.java: exportToXml private static void exportToXml() { XStream xstream = new XStream(new DomDriver()); try { FileWriter xmlFile = new FileWriter(XMLXML_FILE_NAME); ObjectContainer container = Db4o.openFile(DB4O_FILE_NAME); try { ObjectSet result = container.query(Car.class); Car[] cars = new Car[result.size()]; for (int i = 0; i < result.size(); i++) { Car car = (Car) result.next(); cars[i] = car; } String xml = xstream.toXML(cars); xmlFile.write("<?xml version=\"1.0\"?>\n" + xml); xmlFile.close(); } finally { container.close(); } } catch (Exception ex) { System.out.println(ex.getMessage()); } }
/**
 * k-means of the words in the vector file.
 *
 * <p>Builds an initial assignment and delegates to
 * {@code cluster( k, map, original, words )}. The first {@code k} positions
 * are assigned to clusters {@code 0..k-1}, so every cluster index is used at
 * least once. Every remaining position gets a random cluster in
 * {@code [0, k)}. The words are taken in the iteration order of
 * {@code map.vectors.keySet()}.
 *
 * <p>NOTE(review): {@code k} is expected to satisfy
 * {@code 1 <= k <= number of words}. A larger {@code k} fails with an
 * {@link ArrayIndexOutOfBoundsException} while seeding the first {@code k}
 * positions.
 *
 * @param k number of clusters
 * @param map vector
 * @return clustering of the words in the vector
 */
public Object2ObjectOpenHashMap<String, ClusterEntry> cluster( final int k, final UncompressedWordVectors map ) {
    final int len = map.vectors.keySet().size();
    final int[] original = new int[ len ];
    final Random r = new Random();

    // Seed: one position per cluster index.
    for( int i = 0; i < k; i++ ) {
        original[ i ] = i;
    }
    // Start at k (not k + 1) so that position k is randomised too, instead of
    // always being left at the array default of 0.
    for( int i = k; i < len; i++ ) {
        original[ i ] = r.nextInt( k );
    }

    final String[] words = new String[ len ];
    int z = 0;
    for( String s : map.vectors.keySet() ) {
        words[ z++ ] = s;
    }
    return cluster( k, map, original, words );
}