/**
 * Builds a feature set from {@code names} with the element at index {@code i} removed.
 * The resulting set is named {@code LEFTOUT_FE} followed by the discriminator value of
 * the removed element.
 *
 * @param names
 *            the features to start from
 * @param i
 *            index of the feature that is left out
 * @return a new feature set without the feature at index {@code i}
 */
private static TcFeatureSet getFeatureNamesMinusOne(TcFeature[] names, int i) {
    TcFeatureSet reduced = new TcFeatureSet(names);

    // The name is derived from the left-out element before that element is removed.
    TcFeature leftOut = names[i];
    reduced.setFeatureSetName(LEFTOUT_FE + leftOut.getDiscriminatorValue());

    reduced.remove(i);
    return reduced;
}
/**
 * Creates the feature set: a {@code TokenRatioPerDocument} feature and a
 * {@code CharacterNGram} feature created with {@code PARAM_NGRAM_USE_TOP_K} set to 50.
 *
 * @return a newly created feature set
 */
public TcFeatureSet getFeatureSet() {
    TcFeature tokenRatio = TcFeatureFactory.create(TokenRatioPerDocument.class);
    TcFeature charNGrams = TcFeatureFactory.create(CharacterNGram.class,
            CharacterNGram.PARAM_NGRAM_USE_TOP_K, 50);
    return new TcFeatureSet(tokenRatio, charNGrams);
}
/**
 * Casts the given resource to {@code FeatureExtractor} and runs its {@code extract}
 * method on the given CAS and target.
 *
 * @param aJCas
 *            the CAS handed to the extractor
 * @param aTarget
 *            the target handed to the extractor
 * @param aFeatExtractor
 *            the resource to use; it is cast to {@code FeatureExtractor}
 * @return whatever the extractor returns
 * @throws TextClassificationException
 *             declared by this method; presumably propagated from the extractor
 */
private Set<Feature> getDense(JCas aJCas, TextClassificationTarget aTarget,
        FeatureExtractorResource_ImplBase aFeatExtractor)
    throws TextClassificationException {
    FeatureExtractor extractor = (FeatureExtractor) aFeatExtractor;
    return extractor.extract(aJCas, aTarget);
}
/**
 * Builds an identifier of the form {@code <jcasId>_<sequenceId>} for the instance.
 *
 * @param i
 *            the instance whose ids are read
 * @return the JCas id and the sequence id joined by an underscore
 */
private String getId(Instance i) {
    int jcasId = i.getJcasId();
    int sequenceId = i.getSequenceId();

    StringBuilder id = new StringBuilder();
    id.append(jcasId);
    id.append("_");
    id.append(sequenceId);
    return id.toString();
}
/**
 * Creates a feature set and adds the given features in the order they were passed.
 *
 * @param features
 *            the features to add
 */
public TcFeatureSet(TcFeature... features) {
    for (int idx = 0; idx < features.length; idx++) {
        add(features[idx]);
    }
}
/**
 * Returns the discriminator value cast to {@code String}.
 *
 * @return the discriminator value as a string
 */
@Override
public String toString() {
    final Object discriminator = getDiscriminatorValue();
    return (String) discriminator;
}
} // closes the enclosing type, whose header lies outside this excerpt
/**
 * Sets the feature names of the given store to {@code trainingFeatureNames}, but only
 * if the store reports that setting feature names is allowed; otherwise does nothing.
 *
 * @param store
 *            the feature store to update
 */
@Override
public void applyFilter(FeatureStore store) {
    if (!store.isSettingFeatureNamesAllowed()) {
        return;
    }
    store.setFeatureNames(this.trainingFeatureNames);
}
@Override public TcFeature current() { // When calling next() after rewind() to position current() at the first // dimension value, no config has been set yet. At this point just // do nothing. if (config == null) { return null; } closures[current].setConfig(config); return closures[current]; }
/**
 * Creates a feature. The name is stored after being passed through
 * {@code escaper.escape}; the feature is marked as not being a default value.
 *
 * @param name
 *            the feature name, stored in escaped form
 * @param value
 *            the feature value, stored as given
 * @param type
 *            the feature type, stored as given
 * @throws TextClassificationException
 *             declared by this constructor; presumably raised when escaping fails
 */
public Feature(String name, Object value, FeatureType type)
    throws TextClassificationException {
    // Escape first: it is the only step here that calls out to other code.
    this.name = escaper.escape(name);

    this.type = type;
    this.value = value;
    this.isDefaultValue = false;
}
/**
 * Returns the instance at the current position of the feature store and advances the
 * position by one.
 *
 * @return the instance at the current position
 * @throws java.util.NoSuchElementException
 *             if the position has reached the number of instances in the store
 */
@Override
public Instance next() {
    // Fail explicitly when exhausted instead of relying on whatever the store does
    // for an out-of-range index.
    // NOTE(review): assumes this class implements java.util.Iterator - confirm.
    if (instanceCounter >= featureStore.getNumberOfInstances()) {
        throw new java.util.NoSuchElementException(
                "No instance at position " + instanceCounter);
    }

    Instance instance = featureStore.getInstance(instanceCounter);
    instanceCounter++;
    return instance;
}
/**
 * Reports whether the current position is still below the number of instances in the
 * feature store.
 *
 * @return {@code true} if {@code instanceCounter} is smaller than the store's number
 *         of instances
 */
@Override
public boolean hasNext() {
    boolean exhausted = instanceCounter >= featureStore.getNumberOfInstances();
    return !exhausted;
}
/**
 * Creates the feature set: a single {@code WordNGram} feature created without
 * additional parameters.
 *
 * @return a newly created feature set
 */
public TcFeatureSet getFeatureSet() {
    TcFeature wordNGrams = TcFeatureFactory.create(WordNGram.class);
    return new TcFeatureSet(wordNGrams);
}
/**
 * Copies {@code names} into a new feature set and drops the entry at index {@code i}.
 * The set's name is {@code LEFTOUT_FE} concatenated with the discriminator value of the
 * dropped entry.
 *
 * @param names
 *            all features
 * @param i
 *            index of the feature to drop
 * @return a new feature set that lacks the feature at index {@code i}
 */
private static TcFeatureSet getFeatureNamesMinusOne(TcFeature[] names, int i) {
    final TcFeatureSet remaining = new TcFeatureSet(names);

    // Name the set after the dropped feature, then drop it.
    final TcFeature dropped = names[i];
    remaining.setFeatureSetName(LEFTOUT_FE + dropped.getDiscriminatorValue());
    remaining.remove(i);

    return remaining;
}
/**
 * Creates a named feature set and adds the given features in the order they were
 * passed. The name is assigned before any feature is added.
 *
 * @param featureSetName
 *            the name of this feature set
 * @param features
 *            the features to add
 */
public TcFeatureSet(String featureSetName, TcFeature... features) {
    this.featureSetName = featureSetName;

    for (int idx = 0; idx < features.length; idx++) {
        add(features[idx]);
    }
}
/**
 * Creates the feature set: a {@code TokenRatioPerDocument} feature and a
 * {@code WordNGram} feature created with {@code PARAM_NGRAM_USE_TOP_K} = 600,
 * {@code PARAM_NGRAM_MIN_N} = 1 and {@code PARAM_NGRAM_MAX_N} = 3.
 *
 * @return a newly created feature set
 */
public TcFeatureSet getFeatureSet() {
    TcFeature tokenRatio = TcFeatureFactory.create(TokenRatioPerDocument.class);
    TcFeature wordNGrams = TcFeatureFactory.create(WordNGram.class,
            WordNGram.PARAM_NGRAM_USE_TOP_K, 600,
            WordNGram.PARAM_NGRAM_MIN_N, 1,
            WordNGram.PARAM_NGRAM_MAX_N, 3);
    return new TcFeatureSet(tokenRatio, wordNGrams);
}
/**
 * Creates the feature set: {@code SentenceRatioPerDocument},
 * {@code LengthFeatureNominal} and {@code TokenRatioPerDocument}, in that order, each
 * created without additional parameters.
 *
 * @return a newly created feature set
 */
public TcFeatureSet getFeatureSet() {
    TcFeature sentenceRatio = TcFeatureFactory.create(SentenceRatioPerDocument.class);
    TcFeature nominalLength = TcFeatureFactory.create(LengthFeatureNominal.class);
    TcFeature tokenRatio = TcFeatureFactory.create(TokenRatioPerDocument.class);
    return new TcFeatureSet(sentenceRatio, nominalLength, tokenRatio);
}
/**
 * Creates a feature set named {@code "DummyFeatureSet"}: a
 * {@code TokenRatioPerDocument} feature and a {@code CharacterNGram} feature created
 * with {@code PARAM_NGRAM_USE_TOP_K} = 500, {@code PARAM_NGRAM_MIN_N} = 1 and
 * {@code PARAM_NGRAM_MAX_N} = 3.
 *
 * @return a newly created feature set
 */
private static TcFeatureSet getFeatureSet() {
    TcFeature tokenRatio = TcFeatureFactory.create(TokenRatioPerDocument.class);
    TcFeature charNGrams = TcFeatureFactory.create(CharacterNGram.class,
            CharacterNGram.PARAM_NGRAM_USE_TOP_K, 500,
            CharacterNGram.PARAM_NGRAM_MIN_N, 1,
            CharacterNGram.PARAM_NGRAM_MAX_N, 3);
    return new TcFeatureSet("DummyFeatureSet", tokenRatio, charNGrams);
}
/**
 * Creates the feature set: a single {@code DiffNrOfTokensPairFeatureExtractor}
 * feature created without additional parameters.
 *
 * @return a newly created feature set
 */
public TcFeatureSet getFeatureSet() {
    TcFeature tokenCountDiff = TcFeatureFactory
            .create(DiffNrOfTokensPairFeatureExtractor.class);
    return new TcFeatureSet(tokenCountDiff);
}
/**
 * Creates the feature set: {@code TokenRatioPerDocument} followed by
 * {@code InitialCharacterUpperCase}, each created without additional parameters.
 *
 * @return a newly created feature set
 */
public TcFeatureSet getFeatureSet() {
    TcFeature tokenRatio = TcFeatureFactory.create(TokenRatioPerDocument.class);
    TcFeature initialUpperCase = TcFeatureFactory.create(InitialCharacterUpperCase.class);
    return new TcFeatureSet(tokenRatio, initialUpperCase);
}
/**
 * Creates the feature set: a single {@code CharacterNGram} feature created without
 * additional parameters.
 *
 * @return a newly created feature set
 */
public TcFeatureSet getFeatureSet() {
    TcFeature charNGrams = TcFeatureFactory.create(CharacterNGram.class);
    return new TcFeatureSet(charNGrams);
}