public Instance pipe (Instance carrier) { TokenSequence ts = (TokenSequence) carrier.getData(); for (int i = 0; i < ts.size(); i++) { Token t = ts.get(i); String s = t.getText(); if (s.indexOf("&") != -1) { if (s.indexOf("&") != -1) // already friendly return carrier; else { s.replaceAll ("&", "&"); t.setText (s); } } } return carrier; } // Serialization
public Instance pipe (Instance carrier) { TokenSequence ts = (TokenSequence) carrier.getData(); for (int i = 0; i < ts.size(); i++) { Token t = ts.get(i); String s = t.getText(); if (s.indexOf("&") != -1) { if (s.indexOf("&") != -1) // already friendly return carrier; else { s.replaceAll ("&", "&"); t.setText (s); } } } return carrier; } // Serialization
public Instance pipe (Instance carrier) { TokenSequence ts = (TokenSequence) carrier.getData(); for (int i = 0; i < ts.size(); i++) { Token t = ts.get(i); String s = t.getText(); if (s.indexOf("&") != -1) { if (s.indexOf("&") != -1) // already friendly return carrier; else { s.replaceAll ("&", "&"); t.setText (s); } } } return carrier; } // Serialization
/**
 * Lowercases the text of every token in the instance's data.
 *
 * <p>The instance data is cast to a {@code TokenSequence}; each token's text
 * is replaced in place by its {@code toLowerCase()} form (no-argument
 * overload, i.e. the JVM's default locale).
 *
 * @param carrier the instance whose data is a {@code TokenSequence}
 * @return the same {@code carrier}, with token text modified in place
 */
public Instance pipe (Instance carrier)
{
	final TokenSequence tokens = (TokenSequence) carrier.getData();
	int index = 0;
	while (index < tokens.size()) {
		final Token token = tokens.get(index);
		final String lowered = token.getText().toLowerCase();
		token.setText(lowered);
		index++;
	}
	return carrier;
}
/**
 * Lowercases the text of every token in the instance's data.
 *
 * <p>The instance data is cast to a {@code TokenSequence}; each token's text
 * is replaced in place by its {@code toLowerCase()} form (no-argument
 * overload, i.e. the JVM's default locale).
 *
 * @param carrier the instance whose data is a {@code TokenSequence}
 * @return the same {@code carrier}, with token text modified in place
 */
public Instance pipe (Instance carrier)
{
	final TokenSequence tokens = (TokenSequence) carrier.getData();
	int index = 0;
	while (index < tokens.size()) {
		final Token token = tokens.get(index);
		final String lowered = token.getText().toLowerCase();
		token.setText(lowered);
		index++;
	}
	return carrier;
}
/**
 * Lowercases the text of every token in the instance's data.
 *
 * <p>The instance data is cast to a {@code TokenSequence}; each token's text
 * is replaced in place by its {@code toLowerCase()} form (no-argument
 * overload, i.e. the JVM's default locale).
 *
 * @param carrier the instance whose data is a {@code TokenSequence}
 * @return the same {@code carrier}, with token text modified in place
 */
public Instance pipe (Instance carrier)
{
	final TokenSequence tokens = (TokenSequence) carrier.getData();
	int index = 0;
	while (index < tokens.size()) {
		final Token token = tokens.get(index);
		final String lowered = token.getText().toLowerCase();
		token.setText(lowered);
		index++;
	}
	return carrier;
}
/**
 * Splits each token's text into a data part and a target part using
 * {@code regex}.
 *
 * <p>For every token whose full text matches {@code regex}, capture group
 * {@code targetGroup} is appended to a newly created target
 * {@code TokenSequence} and the token's text is replaced by capture group
 * {@code dataGroup}. A token that does not match is left unchanged, nothing
 * is appended to the target sequence for it, and a warning is logged.
 *
 * <p>Afterwards the new sequence is installed as the carrier's target and
 * the (in-place modified) data sequence is set back as the carrier's data.
 *
 * @param carrier the instance whose data is a {@code TokenSequence}
 * @return the same {@code carrier}, with data and target updated
 */
public Instance pipe (Instance carrier)
{
	final TokenSequence dataTokens = (TokenSequence) carrier.getData();
	final TokenSequence targetTokens = new TokenSequence (dataTokens.size());

	for (int pos = 0; pos < dataTokens.size(); pos++) {
		final Token current = dataTokens.get(pos);
		final Matcher m = regex.matcher (current.getText());

		if (!m.matches()) {
			// No target is recorded for this token; it stays in the data as-is.
			logger.warning ("Skipping token: No match of " + regex.pattern()
					+ " at token #" + pos + " with text " + current.getText());
			continue;
		}

		// Record the target first, then overwrite the token text with the data part.
		targetTokens.add (m.group (targetGroup));
		final String dataText = m.group (dataGroup);
		current.setText (dataText);
	}

	carrier.setTarget (targetTokens);
	carrier.setData (dataTokens);
	return carrier;
}
/**
 * Splits each token's text into a data part and a target part using
 * {@code regex}.
 *
 * <p>For every token whose full text matches {@code regex}, capture group
 * {@code targetGroup} is appended to a newly created target
 * {@code TokenSequence} and the token's text is replaced by capture group
 * {@code dataGroup}. A token that does not match is left unchanged, nothing
 * is appended to the target sequence for it, and a warning is logged.
 *
 * <p>Afterwards the new sequence is installed as the carrier's target and
 * the (in-place modified) data sequence is set back as the carrier's data.
 *
 * @param carrier the instance whose data is a {@code TokenSequence}
 * @return the same {@code carrier}, with data and target updated
 */
public Instance pipe (Instance carrier)
{
	final TokenSequence dataTokens = (TokenSequence) carrier.getData();
	final TokenSequence targetTokens = new TokenSequence (dataTokens.size());

	for (int pos = 0; pos < dataTokens.size(); pos++) {
		final Token current = dataTokens.get(pos);
		final Matcher m = regex.matcher (current.getText());

		if (!m.matches()) {
			// No target is recorded for this token; it stays in the data as-is.
			logger.warning ("Skipping token: No match of " + regex.pattern()
					+ " at token #" + pos + " with text " + current.getText());
			continue;
		}

		// Record the target first, then overwrite the token text with the data part.
		targetTokens.add (m.group (targetGroup));
		final String dataText = m.group (dataGroup);
		current.setText (dataText);
	}

	carrier.setTarget (targetTokens);
	carrier.setData (dataTokens);
	return carrier;
}
/**
 * Splits each token's text into a data part and a target part using
 * {@code regex}.
 *
 * <p>For every token whose full text matches {@code regex}, capture group
 * {@code targetGroup} is appended to a newly created target
 * {@code TokenSequence} and the token's text is replaced by capture group
 * {@code dataGroup}. A token that does not match is left unchanged, nothing
 * is appended to the target sequence for it, and a warning is logged.
 *
 * <p>Afterwards the new sequence is installed as the carrier's target and
 * the (in-place modified) data sequence is set back as the carrier's data.
 *
 * @param carrier the instance whose data is a {@code TokenSequence}
 * @return the same {@code carrier}, with data and target updated
 */
public Instance pipe (Instance carrier)
{
	final TokenSequence dataTokens = (TokenSequence) carrier.getData();
	final TokenSequence targetTokens = new TokenSequence (dataTokens.size());

	for (int pos = 0; pos < dataTokens.size(); pos++) {
		final Token current = dataTokens.get(pos);
		final Matcher m = regex.matcher (current.getText());

		if (!m.matches()) {
			// No target is recorded for this token; it stays in the data as-is.
			logger.warning ("Skipping token: No match of " + regex.pattern()
					+ " at token #" + pos + " with text " + current.getText());
			continue;
		}

		// Record the target first, then overwrite the token text with the data part.
		targetTokens.add (m.group (targetGroup));
		final String dataText = m.group (dataGroup);
		current.setText (dataText);
	}

	carrier.setTarget (targetTokens);
	carrier.setData (dataTokens);
	return carrier;
}
token.setText(currWord);
token.setFeatureValue(metaName + "=" + meta, 1); token.setText(currWord);
token.setText(currWord);