/**
 * Appends the data carried by an instance to this sequence.
 *
 * @param carrier the instance whose data is appended; the data must be a {@code Token}
 * @param iteratedPipe not used by this implementation
 * @throws IllegalArgumentException if the carrier's data is not a {@code Token}
 *         (this includes {@code null} data)
 */
public void pipeOutputAccumulate(Instance carrier, Pipe iteratedPipe) {
    Object data = carrier.getData();
    if (!(data instanceof Token)) {
        // Report what was actually received so the failing pipe stage can be identified.
        String found = (data == null) ? "null" : data.getClass().getName();
        throw new IllegalArgumentException(
            "TokenSequence can only accumulate Tokens, but got " + found);
    }
    add((Token) data);
}
/**
 * Interprets the carrier's data as a file name, opens that file with a buffered
 * reader, and replaces the data with whatever the reader-accepting overload of
 * {@code pipe} returns.
 *
 * <p>NOTE(review): the reader is not closed here; confirm that the overload it
 * is handed to takes ownership of it.
 *
 * @param carrier the instance whose data is a {@code String} file name
 * @return the same {@code carrier}, with its data replaced
 * @throws IllegalArgumentException if the file cannot be opened or read; the
 *         underlying {@code IOException} is attached as the cause
 */
public Instance pipe (Instance carrier) {
    String filename = (String) carrier.getData();
    try {
        carrier.setData(pipe(new BufferedReader(new FileReader(filename))));
    } catch (java.io.IOException e) {
        // Same exception type as before, but keep the file name and the root cause.
        throw new IllegalArgumentException("IOException reading " + filename, e);
    }
    return carrier;
}
/**
 * Wraps {@code obj} in a fresh instance (no target, name or source), runs it
 * through {@code tokenizationPipe}, and returns the instance's resulting data.
 *
 * @param obj the raw data to tokenize
 * @return the wrapped instance's data after piping, cast to {@code Tokenization}
 */
private Tokenization doTokenize (Object obj) {
    final Instance wrapper = new Instance (obj, null, null, null);
    // The pipe's return value is ignored; the result is read back from the wrapper.
    tokenizationPipe.pipe (wrapper);
    final Object tokenized = wrapper.getData ();
    return (Tokenization) tokenized;
}
/**
 * Replaces the carrier's {@code File} data with a {@code FileIterator} built
 * from that file and this pipe's {@code fileFilter} and {@code labelPattern}.
 *
 * @param carrier the instance whose data is a {@code File}
 * @return the same {@code carrier}, now carrying the iterator
 */
public Instance pipe (Instance carrier) {
    final File root = (File) carrier.getData();
    final FileIterator files = new FileIterator (root, fileFilter, labelPattern);
    carrier.setData(files);
    return carrier;
}
/**
 * Replaces the carrier's {@code FeatureSequence} data with a
 * {@code FeatureVector} constructed from it and this pipe's {@code binary} flag.
 *
 * @param carrier the instance whose data is a {@code FeatureSequence}
 * @return the same {@code carrier}, now carrying the feature vector
 */
public Instance pipe (Instance carrier) {
    final FeatureSequence sequence = (FeatureSequence) carrier.getData();
    final FeatureVector vector = new FeatureVector (sequence, binary);
    carrier.setData(vector);
    return carrier;
}
/**
 * Replaces the carrier's {@code CharSequence[]} data with a
 * {@code TokenSequence} constructed from that array.
 *
 * @param carrier the instance whose data is a {@code CharSequence[]}
 * @return the same {@code carrier}, now carrying the token sequence
 */
public Instance pipe (Instance carrier) {
    final CharSequence[] strings = (CharSequence[]) carrier.getData();
    final TokenSequence tokens = new TokenSequence(strings);
    carrier.setData(tokens);
    return carrier;
}
/**
 * Sets a feature named {@code "NPDistance" + d} to 1 on the carrier's
 * {@code MentionPair}, where {@code d} is the value {@code calcNPDistance}
 * returns for the antecedent's and referent's elements.
 *
 * @param carrier the instance whose data is a {@code MentionPair}
 * @return the same {@code carrier}
 */
public Instance pipe (Instance carrier) {
    MentionPair pair = (MentionPair) carrier.getData();
    // Integer.valueOf replaces the deprecated Integer constructor; the rendered text is unchanged.
    Integer distance = Integer.valueOf(
        calcNPDistance(pair.getAntecedent().getElement(), pair.getReferent().getElement()));
    String featureName = "NPDistance" + distance;
    pair.setFeatureValue(featureName, 1);
    return carrier;
}
/**
 * Sets the {@code "IdenticalString"} feature to 1.0 on the carrier's
 * {@code MentionPair} when both mentions are present and their strings are equal.
 *
 * @param carrier the instance whose data is a {@code MentionPair}
 * @return the same {@code carrier}
 */
public Instance pipe (Instance carrier) {
    MentionPair pair = (MentionPair) carrier.getData();
    Mention ant = pair.getAntecedent();
    Mention ref = pair.getReferent();
    if (ant != null && ref != null && ref.getString().equals(ant.getString())) {
        // A string literal is sufficient; copying it with new String(..) was redundant.
        pair.setFeatureValue("IdenticalString", 1.0);
    }
    return carrier;
}
/**
 * Loads the serialized CRF at {@code oldCrfFile}, pipes {@code testString}
 * through the CRF's input pipe, transduces the result, and checks the
 * rendered output labels.
 */
public void testOldCrf () {
    File modelFile = new File (oldCrfFile);
    CRF4 crf = (CRF4) FileUtils.readObject (modelFile);

    Instance inst = new Instance (testString, null, null, null, crf.getInputPipe ());
    Sequence input = (Sequence) inst.getData ();
    Sequence output = crf.transduce (input);

    assertEquals (" B-PER I-PER O O", output.toString ());
}
/**
 * For a pair that is not a null pair, sets a feature named
 * {@code "SentenceDistance" + d + "Pronoun" + P} to 1, where {@code d} is the
 * referent's sentence index minus the antecedent's sentence index and
 * {@code P} is the referent's string in upper case.
 *
 * @param carrier the instance whose data is a {@code MentionPair}
 * @return the same {@code carrier}
 */
public Instance pipe (Instance carrier) {
    MentionPair pair = (MentionPair) carrier.getData();
    if (!pair.nullPair()) {
        int distance = pair.getReferent().getMalletPhrase().getSentence().getIndex()
            - pair.getAntecedent().getMalletPhrase().getSentence().getIndex();
        // Use a fixed locale so feature names do not depend on the JVM's default
        // locale (e.g. Turkish upper-cases "i" to a dotted capital I).
        String pronoun = pair.getReferent().getString().toUpperCase(java.util.Locale.ENGLISH);
        String featureName = "SentenceDistance" + distance + "Pronoun" + pronoun;
        pair.setFeatureValue(featureName, 1);
    }
    return carrier;
}
/**
 * Sets the carrier's source to a two-line description built from the original
 * strings of the two citations held by the carrier's {@code NodePair}.
 *
 * @param carrier the instance whose data is a {@code NodePair} of {@code Citation}s
 * @return the same {@code carrier}, with its source replaced
 */
public Instance pipe (Instance carrier) {
    NodePair pair = (NodePair) carrier.getData();
    Citation s1 = (Citation) pair.getObject1();
    Citation s2 = (Citation) pair.getObject2();
    // The concatenation already yields a new String; wrapping it in new String(..) was redundant.
    carrier.setSource("Citation1:" + s1.getOrigString() + "\nCitation2:" + s2.getOrigString());
    return carrier;
}
/**
 * Classifies an instance by locating its leaf under {@code root} and returning
 * a {@code Classification} built from that leaf's {@code labeling}.
 *
 * @param instance the instance to classify; its data, obtained via
 *        {@code getData(instancePipe)}, must be a {@code FeatureVector}
 * @return a classification of {@code instance} by this classifier
 */
public Classification classify (Instance instance) {
    final FeatureVector features = (FeatureVector) instance.getData (instancePipe);
    // With assertions enabled: when a pipe is set, the vector must share its data alphabet.
    assert instancePipe == null
        || features.getAlphabet () == this.instancePipe.getDataAlphabet ();
    final Node reached = getLeaf (root, features);
    return new Classification (instance, this, reached.labeling);
}
/**
 * For each entry of {@code fields}, sets the feature
 * {@code "Same_" + field + "_thereExists"} to 1.0 on the carrier's
 * {@code NodeClusterPair} when {@code matchesAtLeastNInCluster} reports at
 * least one match in the cluster for the node's value of that field.
 *
 * @param carrier the instance whose data is a {@code NodeClusterPair}
 * @return the same {@code carrier}
 */
public Instance pipe (Instance carrier) {
    NodeClusterPair pair = (NodeClusterPair) carrier.getData();
    Citation citation = (Citation) pair.getNode();
    Collection members = (Collection) pair.getCluster();

    int idx = 0;
    while (idx < fields.length) {
        String nodeValue = citation.getField(fields[idx]);
        boolean existsInCluster = matchesAtLeastNInCluster (fields[idx], nodeValue, members, 1);
        if (existsInCluster) {
            pair.setFeatureValue ("Same_" + fields[idx] + "_thereExists", 1.0);
        }
        idx++;
    }
    return carrier;
}
/**
 * Moves the carrier's {@code VenuePaperCluster} from data to source and
 * replaces the data with an {@code AugmentableFeatureVector} built from this
 * pipe's data alphabet and the cluster's features.
 *
 * @param carrier the instance whose data is a {@code VenuePaperCluster}
 * @return the same {@code carrier}
 */
public Instance pipe (Instance carrier) {
    VenuePaperCluster cluster = (VenuePaperCluster) carrier.getData();
    carrier.setSource(cluster);
    Alphabet dataAlphabet = (Alphabet) getDataAlphabet();
    carrier.setData(new AugmentableFeatureVector(dataAlphabet, cluster.getFeatures(), false));
    return carrier;
}
}
/**
 * Sets the {@code "GenderDifference"} feature on the carrier's
 * {@code MentionPair} to the absolute difference between the
 * {@code calcFemaleness} values of the antecedent's and referent's elements.
 *
 * @param carrier the instance whose data is a {@code MentionPair}
 * @return the same {@code carrier}
 */
public Instance pipe (Instance carrier) {
    MentionPair pair = (MentionPair) carrier.getData();
    double antecedentScore = calcFemaleness (pair.getAntecedent().getElement());
    double referentScore = calcFemaleness (pair.getReferent().getElement());
    double gap = Math.abs(antecedentScore - referentScore);
    pair.setFeatureValue("GenderDifference", gap);
    return carrier;
}
/**
 * Adds to this list every instance generated by the iterator, by handing each
 * instance's data, target, name and source to the four-argument {@code add}
 * overload.
 *
 * <p>NOTE(review): piping and any out-of-memory safeguards are presumably
 * performed by that overload; this method itself contains no such checks.
 *
 * @param pi the iterator supplying the instances to add
 */
public void add (PipeInputIterator pi) {
    for (; pi.hasNext(); ) {
        Instance next = pi.nextInstance();
        add (next.getData(), next.getTarget(), next.name, next.getSource());
    }
}
/**
 * Classifies an instance by locating its leaf under {@code m_root} and
 * returning a {@code Classification} built from the base label distribution
 * of that leaf's gain ratio.
 *
 * @param instance the instance to classify; its data, obtained via
 *        {@code getData(instancePipe)}, must be a {@code FeatureVector}
 * @return a classification of {@code instance} by this classifier
 */
public Classification classify (Instance instance) {
    final FeatureVector features = (FeatureVector) instance.getData (instancePipe);
    // With assertions enabled: when a pipe is set, the vector must share its data alphabet.
    assert instancePipe == null
        || features.getAlphabet () == this.instancePipe.getDataAlphabet ();
    final Node reached = getLeaf(m_root, features);
    return new Classification (
        instance, this, reached.getGainRatio().getBaseLabelDistribution());
}
/**
 * Clones the iterating pipe via serialization, pipes {@code data} through the
 * clone, and checks that the resulting instance list holds three entries.
 *
 * @throws IOException declared for the serialization round trip
 * @throws ClassNotFoundException declared for the serialization round trip
 */
public void testOneFromSerialized () throws IOException, ClassNotFoundException {
    SerialPipes.setSuppressExceptions (false);

    Pipe original = createIteratingPipe ();
    Pipe clone = (Pipe) TestSerializable.cloneViaSerialization (original);

    Instance piped = new Instance (data, null, null, null, clone);
    InstanceList ilist = (InstanceList) piped.getData();
    assertTrue (ilist.size() == 3);
}
/** Adds to this list every instance generated by the iterator, * passing each one through this list's pipe. */ public void add (PipeInputIterator pi) { int i=0; while (pi.hasNext()) { Instance carrier = pi.nextInstance(); // xxx Perhaps try to arrange this so that a new Instance does not have to allocated. add (new Instance (carrier.getData(), carrier.getTarget(), carrier.name, carrier.getSource(), this.pipe)); } }
public String viterbiCRFInstance(Instance instance, boolean sgml ) { assert(crf != null); viterbiP = crf.viterbiPath((Sequence)instance.getData());// regular viterbi viterbiSequence = viterbiP.output(); // confidence = Math.exp(viterbiP.getCost()/viterbiSequence.size()); // confidence = viterbiP.getCost()/viterbiSequence.size(); instance_accuracy= InstanceAccuracy(viterbiSequence, (Sequence)instance.getTarget(), instance); tokenSequence = (TokenSequence)instance.getSource(); assert(viterbiSequence.size() == tokenSequence.size()); return printResultInFormat(sgml); }