/**
 * Normalizes {@code text} and returns the Porter stem of every token that is
 * not an English stop word, in order of appearance.
 *
 * <p>Processing steps:
 * <ol>
 *   <li>lower-case the text (locale-independent);</li>
 *   <li>pass it through {@code DiacriticsRemover.removeDiacritics};</li>
 *   <li>replace underscores and whitespace control characters (tab, newline,
 *       vertical tab, form feed, carriage return) with {@code SPACE};</li>
 *   <li>delete every character other than {@code a-z}, digits, {@code '-'},
 *       {@code '_'}, {@code '/'} and the space character;</li>
 *   <li>split with {@code StringUtils.split} using {@code SPACE} as the
 *       separator, skip tokens reported by
 *       {@code StopWordsRemover.isAnEnglishStopWords}, and stem the rest.</li>
 * </ol>
 *
 * @param text raw input text; must not be {@code null} (a {@code null} value
 *             fails with a {@link NullPointerException} on the first call)
 * @return a new mutable list holding one stem per retained token; duplicates
 *         are kept
 * @throws IOException declared by the signature; no statement visible here
 *                     throws it directly — presumably it comes from one of the
 *                     helper classes (TODO confirm)
 */
public List<String> getStemmedPairs(final String text) throws IOException {
    // Locale.ROOT keeps the ASCII-only filter below reliable: with a Turkish or
    // Azerbaijani default locale, "I" would lower-case to dotless "ı".
    String normalized = text.toLowerCase(java.util.Locale.ROOT);
    normalized = DiacriticsRemover.removeDiacritics(normalized);

    // Turn underscores and every whitespace control character into a separator.
    // Replacing only '\n' let tabs and carriage returns reach the filter below,
    // which deleted them and glued the neighbouring words together.
    normalized = normalized.replaceAll("[_\\t\\n\\x0B\\f\\r]", SPACE);

    // Drop everything that is not a lower-case ASCII letter, a digit, '-', '_',
    // '/' or a space. The '-' after \d is a literal hyphen, not a range.
    normalized = normalized.replaceAll("[^a-z\\d-_/ ]", "");

    List<String> stems = new ArrayList<String>();
    // A single stemmer instance is reused for every token, as in the original.
    PorterStemmer stemmer = new PorterStemmer();
    for (String token : StringUtils.split(normalized, SPACE)) {
        if (StopWordsRemover.isAnEnglishStopWords(token)) {
            continue;
        }
        stemmer.add(token.toCharArray(), token.length());
        stemmer.stem();
        stems.add(stemmer.toString());
    }
    return stems;
}
PorterStemmer ps = new PorterStemmer(); for (String s : StringUtils.split(tmp, SPACE)) { s = s.replaceAll("^[/\\-]+", "");
PorterStemmer s = new PorterStemmer(); for (int i = 0; i < args.length; i++) { try {
PorterStemmer stemmer = new PorterStemmer(); for(String string : DiacriticsRemover.removeDiacritics(inputDataStringBuilder.toString()) .toLowerCase().split(" ")){
vals_str = vals_str.replaceAll("[^a-z ]", ""); PorterStemmer ps = new PorterStemmer(); List<Tuple> alt = new ArrayList<Tuple>(); for (String s : vals_str.split(" ")) {