edu.stanford.nlp.ie.AbstractSequenceClassifier.classifyWithGlobalInformation Java code examples

/**
 * Classifies a token sequence, making the enclosing document and sentence available
 * to the classifier as additional (global) information.
 * Used by SUTime (NumberSequenceClassifier), which requires the doc date to resolve relative dates.
 *
 * @param tokenSequence The tokens to classify; they are first passed through {@code preprocessTokens}.
 * @param doc The document-level information handed on to {@code classifyWithGlobalInformation}.
 * @param sentence The sentence-level information handed on to {@code classifyWithGlobalInformation}.
 * @return The preprocessed List of IN after classification, where the classifier output for
 *         each token is stored in its "answer" field.
 */
public List<IN> classifySentenceWithGlobalInformation(List<? extends HasWord> tokenSequence, final CoreMap doc, final CoreMap sentence) {
 // The preprocessed list is the object that gets classified and then returned.
 final List<IN> preprocessed = preprocessTokens(tokenSequence);
 classifyWithGlobalInformation(preprocessed, doc, sentence);
 return preprocessed;
}

/**
 * Runs the number sequence classifier ({@code nsc}) over a copy of the given tokens and
 * merges its output back into the original tokens.
 * <p>
 * An existing AnswerAnnotation is only replaced when it is absent, equal to the classifier's
 * background symbol, or "MISC", and the new answer is not the background symbol. All other
 * annotations are transferred via {@code NumberSequenceClassifier.transferAnnotations}.
 *
 * @param words The tokens to annotate; modified in place.
 * @param document The document passed to the classifier as global information.
 * @param sentence The sentence passed to {@code copyTokens} and to the classifier.
 */
private void recognizeNumberSequences(List<CoreLabel> words, final CoreMap document, final CoreMap sentence) {
 // Work on a copy: NumberSequenceClassifier overwrites the AnswerAnnotation.
 final List<CoreLabel> classifiedCopy = NumberSequenceClassifier.copyTokens(words, sentence);
 nsc.classifyWithGlobalInformation(classifiedCopy, document, sentence);

 final int total = words.size();
 int idx = 0;
 while (idx < total) {
  final CoreLabel target = words.get(idx);
  final CoreLabel classified = classifiedCopy.get(idx);
  final String existing = target.get(CoreAnnotations.AnswerAnnotation.class);
  final String proposed = classified.get(CoreAnnotations.AnswerAnnotation.class);
  final String background = nsc.flags.backgroundSymbol;

  // Only fill in answers that carry no real label yet; never overwrite one.
  final boolean replaceable = existing == null || existing.equals(background) || existing.equals("MISC");
  // NOTE(review): proposed is dereferenced without a null check — assumes the classifier
  // always sets an answer on every copied token; confirm.
  if (replaceable && !proposed.equals(background)) {
   target.set(CoreAnnotations.AnswerAnnotation.class, proposed);
  }

  // Carry over the remaining annotations generated by SUTime or NumberNormalizer.
  NumberSequenceClassifier.transferAnnotations(classified, target);
  idx++;
 }
}

/**
 * Classifies a copy of the sentence's tokens with {@code nsc} and merges the result back
 * into the original tokens.
 * <p>
 * A token's NER label is only replaced when it is absent, equal to BACKGROUND_SYMBOL, or
 * "MISC", and the new answer is not BACKGROUND_SYMBOL. All other annotations are transferred
 * via {@code NumberSequenceClassifier.transferAnnotations}.
 *
 * @param words The tokens to annotate; modified in place.
 * @param doc The document passed to the classifier as global information.
 * @param sentence The sentence passed to {@code copyTokens} and to the classifier.
 */
private void doOneSentenceNew(List<CoreLabel> words, Annotation doc, CoreMap sentence) {
 final List<CoreLabel> classifiedCopy = NumberSequenceClassifier.copyTokens(words, sentence);
 nsc.classifyWithGlobalInformation(classifiedCopy, doc, sentence);

 // Walk both lists in lock-step; the copy is expected to line up with the originals.
 final Iterator<? extends CoreLabel> classifiedIt = classifiedCopy.iterator();
 final Iterator<CoreLabel> originalIt = words.iterator();
 while (originalIt.hasNext()) {
  final CoreLabel target = originalIt.next();
  final CoreLabel classified = classifiedIt.next();
  final String existing = target.ner();
  final String proposed = classified.get(CoreAnnotations.AnswerAnnotation.class);

  if (VERBOSE) {
   log.info(classified);
  }

  // Only fill in labels for tokens that carry no real NER label yet.
  final boolean replaceable = existing == null || existing.equals(BACKGROUND_SYMBOL) || existing.equals("MISC");
  // NOTE(review): proposed is dereferenced without a null check — assumes the classifier
  // always sets an answer on every copied token; confirm.
  if (replaceable && !proposed.equals(BACKGROUND_SYMBOL)) {
   target.setNER(proposed);
  }

  // Carry over the remaining annotations generated by SUTime or NumberNormalizer.
  NumberSequenceClassifier.transferAnnotations(classified, target);
 }
}

/**
 * Classifies a token sequence, making the enclosing document and sentence available
 * to the classifier as additional (global) information.
 * Used by SUTime (NumberSequenceClassifier), which requires the doc date to resolve relative dates.
 *
 * @param tokenSequence The tokens to classify; they are first passed through {@code preprocessTokens}.
 * @param doc The document-level information handed on to {@code classifyWithGlobalInformation}.
 * @param sentence The sentence-level information handed on to {@code classifyWithGlobalInformation}.
 * @return The preprocessed List of IN after classification, where the classifier output for
 *         each token is stored in its "answer" field.
 */
public List<IN> classifySentenceWithGlobalInformation(List<? extends HasWord> tokenSequence, final CoreMap doc, final CoreMap sentence) {
 // The preprocessed list is the object that gets classified and then returned.
 final List<IN> preprocessed = preprocessTokens(tokenSequence);
 classifyWithGlobalInformation(preprocessed, doc, sentence);
 return preprocessed;
}

 /**
  * Runs the number sequence classifier ({@code nsc}) over a copy of the given tokens and
  * merges its output back into the original tokens.
  * <p>
  * An existing AnswerAnnotation is only replaced when it is absent, equal to the classifier's
  * background symbol, or "MISC", and the new answer is not the background symbol. All other
  * annotations are transferred via {@code NumberSequenceClassifier.transferAnnotations}.
  *
  * @param words The tokens to annotate; modified in place.
  * @param document The document passed to the classifier as global information.
  * @param sentence The sentence passed to {@code copyTokens} and to the classifier.
  */
 private void recognizeNumberSequences(List<CoreLabel> words, final CoreMap document, final CoreMap sentence) {
  // Work on a copy: NumberSequenceClassifier overwrites the AnswerAnnotation.
  final List<CoreLabel> classifiedCopy = NumberSequenceClassifier.copyTokens(words, sentence);
  nsc.classifyWithGlobalInformation(classifiedCopy, document, sentence);

  final int total = words.size();
  int idx = 0;
  while (idx < total) {
   final CoreLabel target = words.get(idx);
   final CoreLabel classified = classifiedCopy.get(idx);
   final String existing = target.get(AnswerAnnotation.class);
   final String proposed = classified.get(AnswerAnnotation.class);
   final String background = nsc.flags.backgroundSymbol;

   // Only fill in answers that carry no real label yet; never overwrite one.
   final boolean replaceable = existing == null || existing.equals(background) || existing.equals("MISC");
   // NOTE(review): proposed is dereferenced without a null check — assumes the classifier
   // always sets an answer on every copied token; confirm.
   if (replaceable && !proposed.equals(background)) {
    target.set(AnswerAnnotation.class, proposed);
   }

   // Carry over the remaining annotations generated by SUTime or NumberNormalizer.
   NumberSequenceClassifier.transferAnnotations(classified, target);
   idx++;
  }
 }
}

/**
 * Runs the number sequence classifier ({@code nsc}) over a copy of the given tokens and
 * merges its output back into the original tokens.
 * <p>
 * An existing AnswerAnnotation is only replaced when it is absent, equal to the classifier's
 * background symbol, or "MISC", and the new answer is not the background symbol. All other
 * annotations are transferred via {@code NumberSequenceClassifier.transferAnnotations}.
 *
 * @param words The tokens to annotate; modified in place.
 * @param document The document passed to the classifier as global information.
 * @param sentence The sentence passed to {@code copyTokens} and to the classifier.
 */
private void recognizeNumberSequences(List<CoreLabel> words, final CoreMap document, final CoreMap sentence) {
 // Work on a copy: NumberSequenceClassifier overwrites the AnswerAnnotation.
 final List<CoreLabel> classifiedCopy = NumberSequenceClassifier.copyTokens(words, sentence);
 nsc.classifyWithGlobalInformation(classifiedCopy, document, sentence);

 final int total = words.size();
 int idx = 0;
 while (idx < total) {
  final CoreLabel target = words.get(idx);
  final CoreLabel classified = classifiedCopy.get(idx);
  final String existing = target.get(CoreAnnotations.AnswerAnnotation.class);
  final String proposed = classified.get(CoreAnnotations.AnswerAnnotation.class);
  final String background = nsc.flags.backgroundSymbol;

  // Only fill in answers that carry no real label yet; never overwrite one.
  final boolean replaceable = existing == null || existing.equals(background) || existing.equals("MISC");
  // NOTE(review): proposed is dereferenced without a null check — assumes the classifier
  // always sets an answer on every copied token; confirm.
  if (replaceable && !proposed.equals(background)) {
   target.set(CoreAnnotations.AnswerAnnotation.class, proposed);
  }

  // Carry over the remaining annotations generated by SUTime or NumberNormalizer.
  NumberSequenceClassifier.transferAnnotations(classified, target);
  idx++;
 }
}

/**
 * Runs the number sequence classifier ({@code nsc}) over a copy of the given tokens and
 * merges its output back into the original tokens.
 * <p>
 * An existing AnswerAnnotation is only replaced when it is absent, equal to the classifier's
 * background symbol, or "MISC", and the new answer is not the background symbol. All other
 * annotations are transferred via {@code NumberSequenceClassifier.transferAnnotations}.
 *
 * @param words The tokens to annotate; modified in place.
 * @param document The document passed to the classifier as global information.
 * @param sentence The sentence passed to {@code copyTokens} and to the classifier.
 */
private void recognizeNumberSequences(List<CoreLabel> words, final CoreMap document, final CoreMap sentence) {
 // Work on a copy: NumberSequenceClassifier overwrites the AnswerAnnotation.
 final List<CoreLabel> classifiedCopy = NumberSequenceClassifier.copyTokens(words, sentence);
 nsc.classifyWithGlobalInformation(classifiedCopy, document, sentence);

 final int total = words.size();
 int idx = 0;
 while (idx < total) {
  final CoreLabel target = words.get(idx);
  final CoreLabel classified = classifiedCopy.get(idx);
  final String existing = target.get(CoreAnnotations.AnswerAnnotation.class);
  final String proposed = classified.get(CoreAnnotations.AnswerAnnotation.class);
  final String background = nsc.flags.backgroundSymbol;

  // Only fill in answers that carry no real label yet; never overwrite one.
  final boolean replaceable = existing == null || existing.equals(background) || existing.equals("MISC");
  // NOTE(review): proposed is dereferenced without a null check — assumes the classifier
  // always sets an answer on every copied token; confirm.
  if (replaceable && !proposed.equals(background)) {
   target.set(CoreAnnotations.AnswerAnnotation.class, proposed);
  }

  // Carry over the remaining annotations generated by SUTime or NumberNormalizer.
  NumberSequenceClassifier.transferAnnotations(classified, target);
  idx++;
 }
}

/**
 * Classifies a copy of the sentence's tokens with {@code nsc} and merges the result back
 * into the original tokens.
 * <p>
 * A token's NER label is only replaced when it is absent, equal to BACKGROUND_SYMBOL, or
 * "MISC", and the new answer is not BACKGROUND_SYMBOL. All other annotations are transferred
 * via {@code NumberSequenceClassifier.transferAnnotations}.
 *
 * @param words The tokens to annotate; modified in place.
 * @param doc The document passed to the classifier as global information.
 * @param sentence The sentence passed to {@code copyTokens} and to the classifier.
 */
private void doOneSentenceNew(List<CoreLabel> words, Annotation doc, CoreMap sentence) {
 final List<CoreLabel> classifiedCopy = NumberSequenceClassifier.copyTokens(words, sentence);
 nsc.classifyWithGlobalInformation(classifiedCopy, doc, sentence);

 // Walk both lists in lock-step; the copy is expected to line up with the originals.
 final Iterator<? extends CoreLabel> classifiedIt = classifiedCopy.iterator();
 final Iterator<CoreLabel> originalIt = words.iterator();
 while (originalIt.hasNext()) {
  final CoreLabel target = originalIt.next();
  final CoreLabel classified = classifiedIt.next();
  final String existing = target.ner();
  final String proposed = classified.get(CoreAnnotations.AnswerAnnotation.class);

  if (VERBOSE) {
   log.info(classified);
  }

  // Only fill in labels for tokens that carry no real NER label yet.
  final boolean replaceable = existing == null || existing.equals(BACKGROUND_SYMBOL) || existing.equals("MISC");
  // NOTE(review): proposed is dereferenced without a null check — assumes the classifier
  // always sets an answer on every copied token; confirm.
  if (replaceable && !proposed.equals(BACKGROUND_SYMBOL)) {
   target.setNER(proposed);
  }

  // Carry over the remaining annotations generated by SUTime or NumberNormalizer.
  NumberSequenceClassifier.transferAnnotations(classified, target);
 }
}

// Excerpt from a larger method (enclosing definition not shown): hand the document to
// the wrapper's processDocument, then classify it with doc and sentence supplied as the
// additional global information.
// NOTE(review): presumably processDocument must run before classification — confirm
// against the full method.
wrapper.processDocument(document);
classifyWithGlobalInformation(document, doc, sentence);

// Excerpt from a larger method (enclosing definition not shown): hand the document to
// the wrapper's processDocument, then classify it with doc and sentence supplied as the
// additional global information.
// NOTE(review): presumably processDocument must run before classification — confirm
// against the full method.
wrapper.processDocument(document);
classifyWithGlobalInformation(document, doc, sentence);

Javadoc

Classify a List of something that extends CoreMap using as additional information whatever is stored in the document and sentence. This is needed for SUTime (NumberSequenceClassifier), which requires the document date to resolve relative dates.

Popular methods of AbstractSequenceClassifier

classifySentence
Classify a List of IN. This method returns a new list of tokens, not the list of tokens passed in, a
backgroundSymbol
Returns the background class for the classifier.
classify
classifyAndWriteAnswers
classifyKBest
Takes a list of tokens and provides the K best sequence labelings of these tokens with their scores.
classifyToString
Classify the contents of a String to one of several String representations that shows the classes. P
classifyWithInlineXML
Classify the contents of a String. Plain text or XML is expected and the PlainTextDocumentReaderAndW
countResults
Count the successes and failures of the model on the given document. Fills numbers in to counters fo
getSequenceModel
getViterbiSearchGraph
labels
loadClassifier
Loads a classifier from the file, classpath resource, or URL specified by loadPath. If loadPath ends

Popular in Java

Reading from database using SQL prepared statement
getOriginalFilename (MultipartFile)
Return the original filename in the client's filesystem. This may contain path information depending
notifyDataSetChanged (ArrayAdapter)
compareTo (BigDecimal)
BufferedWriter (java.io)
Wraps an existing Writer and buffers the output. Expensive interaction with the underlying reader is
ConnectException (java.net)
A ConnectException is thrown if a connection cannot be established to a remote host on a specific po
Permission (java.security)
Legacy security code; do not use.
Collections (java.util)
This class consists exclusively of static methods that operate on or return collections. It contains
Vector (java.util)
Vector is an implementation of List, backed by an array and synchronized. All optional operations in
SAXParseException (org.xml.sax)
Encapsulate an XML parse error or warning. This module, both source code and documentation, is in t
Github Copilot alternatives

How to use the classifyWithGlobalInformation method in edu.stanford.nlp.ie.AbstractSequenceClassifier

Best Java code snippets using edu.stanford.nlp.ie.AbstractSequenceClassifier.classifyWithGlobalInformation (Showing top 10 results out of 315)

How to use the classifyWithGlobalInformation method in edu.stanford.nlp.ie.AbstractSequenceClassifier