/**
 * Classifies a single instance described by the names of its active features.
 *
 * <p>The feature names are wrapped in a {@code TokenSequence}, which is passed as the
 * first constructor argument of a new {@code Instance}; the remaining three constructor
 * arguments are {@code null}.
 *
 * @param classifier the classifier that performs the classification
 * @param features the features that are on for this instance
 * @return the classification returned by {@code classifier}
 */
public static Classification classify(Classifier classifier, String[] features) {
    TokenSequence featureTokens = new TokenSequence(features);
    Instance instance = new Instance(featureTokens, null, null, null);
    return classifier.classify(instance);
}
/**
 * Runs the given classifier on an instance built from a set of active features.
 *
 * <p>Only the first constructor argument of the {@code Instance} is populated (with a
 * {@code TokenSequence} created from {@code features}); the other three are {@code null}.
 *
 * @param classifier the classifier to apply
 * @param features the features that are on for this instance
 * @return the classification the classifier produces for that instance
 */
public static Classification classify(Classifier classifier, String[] features) {
    final Instance query =
        new Instance(new TokenSequence(features), null, null, null);
    return classifier.classify(query);
}
/**
 * Copies a list of strings into a new {@code TokenSequence}, preserving list order.
 *
 * @param vals the strings to add; its size is passed to the {@code TokenSequence}
 *     constructor
 * @return a new sequence to which every element of {@code vals} has been added
 */
private TokenSequence makeTokenSeq(List<String> vals) {
    final int expectedSize = vals.size();
    final TokenSequence sequence = new TokenSequence(expectedSize);
    for (String value : vals) {
        sequence.add(value);
    }
    return sequence;
}
} // closes an enclosing scope that was opened before this method (outside this view)
/**
 * Builds a {@code TokenSequence} from the given strings.
 *
 * @param vals the strings to add, in iteration order
 * @return a new sequence, constructed with {@code vals.size()}, containing one added
 *     entry per string
 */
private TokenSequence makeTokenSeq(List<String> vals) {
    TokenSequence result = new TokenSequence(vals.size());
    for (String entry : vals) {
        result.add(entry);
    }
    return result;
}
} // closes an enclosing scope that was opened before this method (outside this view)
/**
 * Computes the classification of an instance given the features that are on for it.
 *
 * <p>The features are turned into a {@code TokenSequence} that becomes the first
 * constructor argument of the {@code Instance} handed to the classifier; the other three
 * constructor arguments are {@code null}.
 *
 * @param classifier the classifier
 * @param features the features that are on for this instance
 * @return the classification
 */
public static Classification classify(Classifier classifier, String[] features) {
    TokenSequence activeFeatures = new TokenSequence(features);
    Instance toClassify = new Instance(activeFeatures, null, null, null);
    Classification outcome = classifier.classify(toClassify);
    return outcome;
}
/**
 * Wraps a list of strings in a freshly created {@code TokenSequence}.
 *
 * @param vals the strings to add; iterated once, in order
 * @return the new sequence, created with {@code vals.size()} as its constructor argument
 */
private TokenSequence makeTokenSeq(List<String> vals) {
    final TokenSequence tokens = new TokenSequence(vals.size());
    for (final String text : vals) {
        tokens.add(text);
    }
    return tokens;
}
} // closes an enclosing scope that was opened before this method (outside this view)
/**
 * Replaces the carrier's character data with a {@code TokenSequence} built from the
 * lines of that text.
 *
 * <p>The text is split with {@link String#split(String)} on the value of the
 * {@code line.separator} system property, so only the running platform's line
 * terminator is recognised, and trailing empty lines are dropped by {@code split}.
 *
 * @param carrier the instance to transform; its data must be a {@link CharSequence}
 * @return the same {@code carrier}, with its data replaced
 * @throws IllegalArgumentException if the carrier's data is {@code null} or not a
 *     {@code CharSequence}
 */
public Instance pipe (Instance carrier) {
    Object data = carrier.getData();
    if (!(data instanceof CharSequence)) {
        // Name the offending type so a mis-ordered pipeline can be diagnosed.
        throw new IllegalArgumentException(
            "Expected CharSequence data but found "
                + (data == null ? "null" : data.getClass().getName()));
    }
    // NOTE(review): split() interprets its argument as a regular expression; the usual
    // separators ("\n", "\r\n", "\r") contain no regex metacharacters.
    String[] lines = data.toString().split(System.getProperty("line.separator"));
    carrier.setData(new TokenSequence(lines));
    return carrier;
}
/**
 * Splits the carrier's text into lines and stores them as a {@code TokenSequence}.
 *
 * <p>Lines are delimited by the {@code line.separator} system property, which is passed
 * to {@link String#split(String)}; text using a different line terminator than the
 * running platform is therefore not split, and {@code split} discards trailing empty
 * lines.
 *
 * @param carrier the instance to transform; its data must be a {@link CharSequence}
 * @return the same {@code carrier}, now holding the {@code TokenSequence}
 * @throws IllegalArgumentException if the carrier's data is {@code null} or not a
 *     {@code CharSequence}
 */
public Instance pipe (Instance carrier) {
    final Object data = carrier.getData();
    if (data instanceof CharSequence) {
        final String text = data.toString();
        // NOTE(review): the separator is used as a regex by split(); the usual
        // separators contain no metacharacters.
        final String[] lines = text.split(System.getProperty("line.separator"));
        carrier.setData(new TokenSequence(lines));
        return carrier;
    }
    // Report what was actually received instead of throwing a message-less exception.
    throw new IllegalArgumentException(
        "Expected CharSequence data but found "
            + (data == null ? "null" : data.getClass().getName()));
}
/**
 * Converts character data into a {@code TokenSequence} built from the lines of the text.
 *
 * <p>The line boundary is whatever the {@code line.separator} system property holds; it
 * is handed to {@link String#split(String)}, which also removes trailing empty lines.
 *
 * @param carrier the instance to transform; its data must be a {@link CharSequence}
 * @return the same {@code carrier}, with its data replaced by the token sequence
 * @throws IllegalArgumentException if the carrier's data is {@code null} or not a
 *     {@code CharSequence}
 */
public Instance pipe (Instance carrier) {
    Object data = carrier.getData();
    boolean isText = data instanceof CharSequence;
    if (!isText) {
        String found = (data == null) ? "null" : data.getClass().getName();
        // A descriptive message makes a wrongly typed input traceable.
        throw new IllegalArgumentException("Expected CharSequence data but found " + found);
    }
    String separator = System.getProperty("line.separator");
    // NOTE(review): split() treats the separator as a regex; the usual separators contain
    // no regex metacharacters.
    String[] lines = data.toString().split(separator);
    carrier.setData(new TokenSequence(lines));
    return carrier;
}
/**
 * Replaces the carrier's data, an array of character sequences, with a
 * {@code TokenSequence} constructed from that array.
 *
 * <p>The data is cast to {@code CharSequence[]} without a prior type check, so non-null
 * data of any other type fails with a {@link ClassCastException}.
 *
 * @param carrier the instance whose data is converted
 * @return the same {@code carrier}, with its data replaced
 */
public Instance pipe (Instance carrier) {
    CharSequence[] pieces = (CharSequence[]) carrier.getData();
    TokenSequence tokens = new TokenSequence(pieces);
    carrier.setData(tokens);
    return carrier;
}
/**
 * Turns a {@code CharSequence[]} payload into a {@code TokenSequence}.
 *
 * <p>No type check precedes the cast; non-null data that is not a
 * {@code CharSequence[]} raises a {@link ClassCastException}.
 *
 * @param carrier the instance to transform in place
 * @return {@code carrier} itself, after its data has been replaced
 */
public Instance pipe (Instance carrier) {
    final CharSequence[] source = (CharSequence[]) carrier.getData();
    carrier.setData(new TokenSequence(source));
    return carrier;
}
/**
 * Wraps the carrier's array of character sequences in a {@code TokenSequence} and stores
 * that sequence back as the carrier's data.
 *
 * <p>The cast to {@code CharSequence[]} is unchecked: non-null data of another type
 * causes a {@link ClassCastException}.
 *
 * @param carrier the instance whose data is rewritten
 * @return the same instance that was passed in
 */
public Instance pipe (Instance carrier) {
    Object raw = carrier.getData();
    CharSequence[] texts = (CharSequence[]) raw;
    TokenSequence wrapped = new TokenSequence(texts);
    carrier.setData(wrapped);
    return carrier;
}
/**
 * Produces a token sequence from a randomly generated feature sequence.
 *
 * <p>A feature sequence is obtained from {@code randomFeatureSequence(r, length)}; the
 * string form of the object at each of its first {@code length} positions is added to
 * the result, in order.
 *
 * @param r the randomness source forwarded to {@code randomFeatureSequence}
 * @param length the number of positions to read, also passed to the
 *     {@code TokenSequence} constructor
 * @return the newly built token sequence
 */
public TokenSequence randomTokenSequence (Randoms r, int length) {
    FeatureSequence features = randomFeatureSequence(r, length);
    TokenSequence tokens = new TokenSequence(length);
    int position = 0;
    while (position < length) {
        String text = features.getObjectAtPosition(position).toString();
        tokens.add(text);
        position++;
    }
    return tokens;
}
/**
 * Generates a random feature sequence and converts it to a token sequence.
 *
 * <p>For each index from {@code 0} to {@code length - 1}, the object at that position of
 * the feature sequence is converted with {@code toString()} and added to the result.
 *
 * @param r the randomness source forwarded to {@code randomFeatureSequence}
 * @param length how many positions to convert
 * @return a new token sequence holding the converted entries
 */
public TokenSequence randomTokenSequence (Randoms r, int length) {
    final FeatureSequence sampled = randomFeatureSequence(r, length);
    final TokenSequence converted = new TokenSequence(length);
    for (int pos = 0; pos < length; pos++) {
        Object feature = sampled.getObjectAtPosition(pos);
        converted.add(feature.toString());
    }
    return converted;
}
/**
 * Creates a token sequence whose entries are the string forms of a random feature
 * sequence's objects.
 *
 * @param r the randomness source handed to {@code randomFeatureSequence}
 * @param length the number of feature positions to copy; also the argument given to the
 *     {@code TokenSequence} constructor
 * @return the populated token sequence
 */
public TokenSequence randomTokenSequence (Randoms r, int length) {
    FeatureSequence randomFeatures = randomFeatureSequence(r, length);
    TokenSequence result = new TokenSequence(length);
    for (int index = 0; index < length; index++) {
        result.add(randomFeatures.getObjectAtPosition(index).toString());
    }
    return result;
}
/**
 * Replaces the carrier's data with a {@code TokenSequence} derived from
 * {@code ngramify}.
 *
 * <ul>
 *   <li>{@link CharSequence} data: the result of {@code ngramify(data)} is passed to the
 *       {@code TokenSequence} constructor.</li>
 *   <li>{@code TokenSequence} data: for each token, the string form of
 *       {@code ngramify(token.getText())} is added to a new sequence.</li>
 * </ul>
 *
 * @param carrier the instance to transform
 * @return the same {@code carrier}, with its data replaced
 * @throws IllegalArgumentException if the data is {@code null} or of any other type
 */
public Instance pipe (Instance carrier) {
    Object data = carrier.getData();
    if (data instanceof CharSequence) {
        carrier.setData(new TokenSequence(ngramify((CharSequence) data)));
    } else if (data instanceof TokenSequence) {
        TokenSequence ts = (TokenSequence) data;
        TokenSequence ret = new TokenSequence();
        for (int i = 0; i < ts.size(); i++) {
            // NOTE(review): if ngramify returns an array, toString() yields the array's
            // identity string rather than n-gram text -- confirm the return type.
            ret.add(ngramify(ts.get(i).getText()).toString());
        }
        carrier.setData(ret);
    } else {
        // Null data reaches this branch too; avoid calling getClass() on it so the
        // caller gets the intended IllegalArgumentException, not a NullPointerException.
        throw new IllegalArgumentException(
            "Unhandled type " + (data == null ? "null" : data.getClass().toString()));
    }
    return carrier;
}
/**
 * Applies {@code ngramify} to the carrier's data and stores the outcome as a
 * {@code TokenSequence}.
 *
 * <p>{@link CharSequence} data is n-gramified as a whole and the result is given to the
 * {@code TokenSequence} constructor. {@code TokenSequence} data is processed token by
 * token: the string form of {@code ngramify(token.getText())} is added to a fresh
 * sequence.
 *
 * @param carrier the instance to transform
 * @return the same {@code carrier}, with its data replaced
 * @throws IllegalArgumentException if the data is {@code null} or neither a
 *     {@code CharSequence} nor a {@code TokenSequence}
 */
public Instance pipe (Instance carrier) {
    final Object data = carrier.getData();

    if (data instanceof CharSequence) {
        carrier.setData(new TokenSequence(ngramify((CharSequence) data)));
        return carrier;
    }

    if (data instanceof TokenSequence) {
        final TokenSequence input = (TokenSequence) data;
        final TokenSequence output = new TokenSequence();
        for (int i = 0; i < input.size(); i++) {
            // NOTE(review): toString() on the ngramify result is only meaningful if that
            // result is not an array -- confirm against ngramify's declaration.
            output.add(ngramify(input.get(i).getText()).toString());
        }
        carrier.setData(output);
        return carrier;
    }

    // data may be null here; build the message without dereferencing it so the failure
    // is an IllegalArgumentException rather than a NullPointerException.
    throw new IllegalArgumentException(
        "Unhandled type " + (data == null ? "null" : data.getClass().toString()));
}
/**
 * Removes stopwords from the carrier's token sequence.
 *
 * <p>The data is cast to {@code TokenSequence}; every token whose text is not contained
 * in {@code stopwords} is added, in order, to a new sequence that replaces the
 * carrier's data.
 *
 * @param carrier the instance whose data is a {@code TokenSequence}
 * @return the same {@code carrier}, holding the filtered sequence
 */
@Override
public Instance pipe(Instance carrier) {
    TokenSequence tokens = (TokenSequence) carrier.getData();
    TokenSequence kept = new TokenSequence();
    for (int index = 0; index < tokens.size(); index++) {
        Token candidate = tokens.get(index);
        if (stopwords.contains(candidate.getText())) {
            continue; // stopword: leave it out of the result
        }
        kept.add(candidate);
    }
    carrier.setData(kept);
    return carrier;
}
/**
 * Filters the carrier's token sequence, keeping only tokens whose text is not in
 * {@code stopwords}.
 *
 * <p>The surviving tokens are added to a new {@code TokenSequence} in their original
 * order, and that sequence becomes the carrier's data.
 *
 * @param carrier the instance to filter; its data is cast to {@code TokenSequence}
 * @return the same {@code carrier} after its data has been replaced
 */
@Override
public Instance pipe(Instance carrier) {
    final TokenSequence input = (TokenSequence) carrier.getData();
    final TokenSequence output = new TokenSequence();
    int i = 0;
    while (i < input.size()) {
        final Token token = input.get(i);
        final boolean isStopword = stopwords.contains(token.getText());
        if (!isStopword) {
            output.add(token);
        }
        i++;
    }
    carrier.setData(output);
    return carrier;
}
/**
 * Creates an instance from a sentence, adding one token and one label per sentence
 * element.
 *
 * <p>The superclass constructor receives an empty {@code TokenSequence}, an empty
 * {@code LabelSequence} over {@code targetAlphabet}, the sentence id, and the sentence
 * itself. The sequences returned by {@code getData()} and {@code getTarget()} are then
 * filled from each {@code TextToken}'s text and tag.
 *
 * @param textSentence the sentence whose tokens supply the texts and tags
 * @param targetAlphabet the alphabet given to the {@code LabelSequence}
 */
public TextInstance(TextSentence textSentence, Alphabet targetAlphabet) {
    super(
        new TokenSequence(),
        new LabelSequence(targetAlphabet),
        textSentence.getId(),
        textSentence);

    // Presumably these are the two empty sequences passed to super(...) above.
    TokenSequence tokens = (TokenSequence) getData();
    LabelSequence labels = (LabelSequence) getTarget();

    for (TextToken sentenceToken : textSentence) {
        String tokenText = sentenceToken.getText();
        String tag = sentenceToken.getTag();
        tokens.add(new Token(tokenText));
        labels.add(tag);
    }
}