// Snowball stemmer, selected by name; it is handed to the filter below.
SnowballStemmer stemmer = new SnowballStemmer();
stemmer.setStemmer("English");

// String-to-word-vector filter. 1000 is the constructor argument
// (the words-to-keep limit per the Weka API — confirm against the Weka version in use).
StringToWordVector STWfilter = new StringToWordVector(1000);

// Token handling: enable the stoplist and stem tokens with the stemmer above.
STWfilter.setStemmer(stemmer);
STWfilter.setUseStoplist(true);

// Term weighting: output word counts with both the TF and IDF transforms enabled.
STWfilter.setOutputWordCounts(true);
STWfilter.setTFTransform(true);
STWfilter.setIDFTransform(true);

// Document-length normalization: FILTER_NORMALIZE_ALL chosen from TAGS_FILTER.
STWfilter.setNormalizeDocLength(
    new SelectedTag(
        StringToWordVector.FILTER_NORMALIZE_ALL,
        StringToWordVector.TAGS_FILTER));

// Kept as the final step so every option above is already set when the
// filter receives the structure of the training data.
STWfilter.setInputFormat(train);
setNormalizeDocLength(new SelectedTag(Integer.parseInt(nString), TAGS_FILTER)); } else { setNormalizeDocLength(new SelectedTag(FILTER_NONE, TAGS_FILTER));
setNormalizeDocLength(new SelectedTag(Integer.parseInt(nString), TAGS_FILTER)); } else { setNormalizeDocLength(new SelectedTag(FILTER_NONE, TAGS_FILTER));