private void getSignature8(String word, StringBuilder sb) { sb.append('-'); boolean digit = true; for (int i = 0; i < word.length(); i++) { char c = word.charAt(i); if ( ! (Character.isDigit(c) || c == '.' || c == ',' || (i == 0 && (c == '-' || c == '+')))) { digit = false; } } // digit = false; // todo: Just turned off while we test it. if (digit) { sb.append("NUMBER"); } else { if (distSim == null) { distSim = new DistSimClassifier(wordClassesFile, false, true); // todo XXXX booleans depend on distsim file; need more options } String cluster = distSim.distSimClass(word); if (cluster == null) { cluster = "NULL"; } sb.append(cluster); } }
private void getSignature8(String word, StringBuilder sb) { sb.append('-'); boolean digit = true; for (int i = 0; i < word.length(); i++) { char c = word.charAt(i); if ( ! (Character.isDigit(c) || c == '.' || c == ',' || (i == 0 && (c == '-' || c == '+')))) { digit = false; } } // digit = false; // todo: Just turned off while we test it. if (digit) { sb.append("NUMBER"); } else { if (distSim == null) { distSim = new DistSimClassifier(wordClassesFile, false, true); // todo XXXX booleans depend on distsim file; need more options } String cluster = distSim.distSimClass(word); if (cluster == null) { cluster = "NULL"; } sb.append(cluster); } }
private void getSignature8(String word, StringBuilder sb) { sb.append('-'); boolean digit = true; for (int i = 0; i < word.length(); i++) { char c = word.charAt(i); if ( ! (Character.isDigit(c) || c == '.' || c == ',' || (i == 0 && (c == '-' || c == '+')))) { digit = false; } } // digit = false; // todo: Just turned off while we test it. if (digit) { sb.append("NUMBER"); } else { if (distSim == null) { distSim = new DistSimClassifier(wordClassesFile, false, true); // todo XXXX booleans depend on distsim file; need more options } String cluster = distSim.distSimClass(word); if (cluster == null) { cluster = "NULL"; } sb.append(cluster); } }
private void getSignature8(String word, StringBuilder sb) { sb.append('-'); boolean digit = true; for (int i = 0; i < word.length(); i++) { char c = word.charAt(i); if ( ! (Character.isDigit(c) || c == '.' || c == ',' || (i == 0 && (c == '-' || c == '+')))) { digit = false; } } // digit = false; // todo: Just turned off while we test it. if (digit) { sb.append("NUMBER"); } else { if (distSim == null) { distSim = new DistSimClassifier(wordClassesFile, false, true); // todo XXXX booleans depend on distsim file; need more options } String cluster = distSim.distSimClass(word); if (cluster == null) { cluster = "NULL"; } sb.append(cluster); } }