org.cleartk.ml.feature.extractor.CleartkExtractor$Preceding.<init> java code examples

/**
 * Configures the chunking scheme and the token/context feature extractors.
 *
 * <p>Tokens are chunked into {@code Time} annotations via {@code BioChunking}. Each token gets
 * five extractors (covered text, character-category pattern, {@code TimeWordsExtractor}, the
 * "stem" type path and the "pos" type path); each of those is then also wrapped so it is applied
 * to the 3 preceding and the 3 following tokens.
 *
 * @param context the UIMA context, forwarded to {@code super.initialize}
 * @throws ResourceInitializationException if initialization fails
 */
@Override
public void initialize(UimaContext context) throws ResourceInitializationException {
 super.initialize(context);

 // Token -> Time chunking definition.
 this.chunking = new BioChunking<Token, Time>(Token.class, Time.class);

 // Per-token features; the insertion order below is kept: text, char pattern, time words, stem, pos.
 CoveredTextExtractor<Token> text = new CoveredTextExtractor<Token>();
 NamedFeatureExtractor1<Token> charPattern = CharacterCategoryPatternFunction.createExtractor();
 TimeWordsExtractor<Token> timeWords = new TimeWordsExtractor<Token>();
 TypePathExtractor<Token> stem = new TypePathExtractor<Token>(Token.class, "stem");
 TypePathExtractor<Token> pos = new TypePathExtractor<Token>(Token.class, "pos");

 this.tokenFeatureExtractors = Lists.newArrayList();
 this.tokenFeatureExtractors.add(text);
 this.tokenFeatureExtractors.add(charPattern);
 this.tokenFeatureExtractors.add(timeWords);
 this.tokenFeatureExtractors.add(stem);
 this.tokenFeatureExtractors.add(pos);

 // Re-use every token extractor over a window of 3 tokens on either side.
 this.contextFeatureExtractors = Lists.newArrayList();
 for (FeatureExtractor1<Token> tokenExtractor : this.tokenFeatureExtractors) {
  Preceding before = new Preceding(3);
  Following after = new Following(3);
  CleartkExtractor<Token, Token> windowed =
    new CleartkExtractor<Token, Token>(Token.class, tokenExtractor, before, after);
  this.contextFeatureExtractors.add(windowed);
 }
}

/**
 * Configures the token-level and context-window feature extractors.
 *
 * <p>Token features are the covered text, the "stem" and "pos" type paths, and the output of
 * {@code ParentNodeFeaturesExtractor}. A single context extractor supplies the covered text of
 * the 3 preceding and 3 following tokens.
 *
 * @param context the UIMA context, forwarded to {@code super.initialize}
 * @throws ResourceInitializationException if initialization fails
 */
@Override
public void initialize(UimaContext context) throws ResourceInitializationException {
 super.initialize(context);

 // Per-token features, added in this order: word, stem, pos, parent-node features.
 CoveredTextExtractor<Token> word = new CoveredTextExtractor<Token>();
 TypePathExtractor<Token> stem = new TypePathExtractor<Token>(Token.class, "stem");
 TypePathExtractor<Token> pos = new TypePathExtractor<Token>(Token.class, "pos");
 ParentNodeFeaturesExtractor parentNode = new ParentNodeFeaturesExtractor();

 this.tokenFeatureExtractors = Lists.newArrayList();
 this.tokenFeatureExtractors.add(word);
 this.tokenFeatureExtractors.add(stem);
 this.tokenFeatureExtractors.add(pos);
 this.tokenFeatureExtractors.add(parentNode);

 // Window of covered text: 3 tokens before and 3 tokens after (uses its own text extractor).
 CleartkExtractor<Token, Token> textWindow = new CleartkExtractor<Token, Token>(
   Token.class,
   new CoveredTextExtractor<Token>(),
   new Preceding(3),
   new Following(3));
 this.contextExtractors = Lists.newArrayList();
 this.contextExtractors.add(textWindow);
}

AssertionCuePhraseAnnotation.class,
baseExtractorCuePhraseCategory,
new CleartkExtractor.Bag(new CleartkExtractor.Preceding(5)),
new CleartkExtractor.Bag(new CleartkExtractor.Following(5))
);

 AssertionCuePhraseAnnotation.class,
 baseExtractorCuePhraseCategory,
 new CleartkExtractor.Bag(new CleartkExtractor.Preceding(5)),
 new CleartkExtractor.Bag(new CleartkExtractor.Following(5))
 );
new CleartkExtractor.Preceding(5),
new CleartkExtractor.Following(4),
new CleartkExtractor.Bag(new CleartkExtractor.Preceding(10)),
new CleartkExtractor.Bag(new CleartkExtractor.Following(10))
);
new TypePathExtractor(BaseToken.class, "partOfSpeech"),
new CleartkExtractor.LastCovered(2),
new CleartkExtractor.Preceding(3),
new CleartkExtractor.Following(2)
);

    new CleartkExtractor.Preceding(5),
    new CleartkExtractor.Following(4),
    new CleartkExtractor.Bag(new CleartkExtractor.Preceding(3)),
    new CleartkExtractor.Bag(new CleartkExtractor.Following(3)),
new CleartkExtractor.Bag(new CleartkExtractor.Preceding(5)),
new CleartkExtractor.Bag(new CleartkExtractor.Following(5)),
new CleartkExtractor.Bag(new CleartkExtractor.Preceding(10)),
new CleartkExtractor.Bag(new CleartkExtractor.Following(10))
    );

   new CleartkExtractor.Preceding( 5 ),
   new CleartkExtractor.Following( 4 ),
   new CleartkExtractor.Bag( new CleartkExtractor.Preceding( 3 ) ),
   new CleartkExtractor.Bag( new CleartkExtractor.Following( 3 ) ),
   new CleartkExtractor.Bag( new CleartkExtractor.Preceding( 5 ) ),
   new CleartkExtractor.Bag( new CleartkExtractor.Following( 5 ) ),
   new CleartkExtractor.Bag( new CleartkExtractor.Preceding( 10 ) ),
   new CleartkExtractor.Bag( new CleartkExtractor.Following( 10 ) )
);
   new TypePathExtractor<>( BaseToken.class, "partOfSpeech" ),
   new CleartkExtractor.LastCovered( 2 ),
   new CleartkExtractor.Preceding( 3 ),
   new CleartkExtractor.Following( 2 )
);

   new CleartkExtractor.LastCovered( 2 ),     // Worked fine
   new CleartkExtractor.Preceding( 5 ),
   new CleartkExtractor.Following( 4 ),
   new CleartkExtractor.Bag( new CleartkExtractor.Preceding( 3 ) ),
   new CleartkExtractor.Bag( new CleartkExtractor.Following( 3 ) ),
   new CleartkExtractor.Bag( new CleartkExtractor.Preceding( 5 ) ),
   new CleartkExtractor.Bag( new CleartkExtractor.Following( 5 ) ),
   new CleartkExtractor.Bag( new CleartkExtractor.Preceding( 10 ) ),
   new CleartkExtractor.Bag( new CleartkExtractor.Following( 10 ) )
);

AssertionCuePhraseAnnotation.class,
baseExtractorCuePhraseCategory,
new CleartkExtractor.Bag(new CleartkExtractor.Preceding(5)),
new CleartkExtractor.Bag(new CleartkExtractor.Following(5))
);

 AssertionCuePhraseAnnotation.class,
 baseExtractorCuePhraseCategory,
 new CleartkExtractor.Bag(new CleartkExtractor.Preceding(5)),
 new CleartkExtractor.Bag(new CleartkExtractor.Following(5))
 );
new CleartkExtractor.Preceding(5),
new CleartkExtractor.Following(4),
new CleartkExtractor.Bag(new CleartkExtractor.Preceding(10)),
new CleartkExtractor.Bag(new CleartkExtractor.Following(10))
);
new TypePathExtractor(BaseToken.class, "partOfSpeech"),
new CleartkExtractor.LastCovered(2),
new CleartkExtractor.Preceding(3),
new CleartkExtractor.Following(2)
);

tgtExtractors.add(new TypePathExtractor<Time>(Time.class, "timeType"));
tgtExtractors.add(new TypePathExtractor<Time>(Time.class, "value"));
tgtExtractors.add(new CleartkExtractor<Time, Token>(Token.class, prepOrVerbExtractor, new Ngram(new Preceding(5))));
this.setTargetExtractors(tgtExtractors);

/**
 * Builds the three extractor lists used by this component.
 *
 * <ul>
 *   <li>{@code simpleExtractors}: the token text passed through lower-case, capital-type and
 *       numeric-type functions plus character n-grams (left-to-right with end index 1-3,
 *       right-to-left with end index 1-6).</li>
 *   <li>{@code windowExtractors}: token text of the 2 preceding and 2 following tokens.</li>
 *   <li>{@code windowNGramExtractors}: the same two windows, each wrapped in an {@code Ngram}.</li>
 * </ul>
 *
 * @param context the UIMA context; not read by this method
 * @throws ResourceInitializationException declared by the signature
 */
public void initialize(UimaContext context) throws ResourceInitializationException {
 // One text extractor instance is shared by all three lists.
 FeatureExtractor1<Token> tokenText = new CoveredTextExtractor<Token>();
 CharacterNgramFeatureFunction.Orientation leftToRight =
   CharacterNgramFeatureFunction.Orientation.LEFT_TO_RIGHT;
 CharacterNgramFeatureFunction.Orientation rightToLeft =
   CharacterNgramFeatureFunction.Orientation.RIGHT_TO_LEFT;

 // Token text plus derived features.
 FeatureFunctionExtractor<Token> derived = new FeatureFunctionExtractor<Token>(
   tokenText,
   new LowerCaseFeatureFunction(),
   new CapitalTypeFeatureFunction(),
   new NumericTypeFeatureFunction(),
   new CharacterNgramFeatureFunction(leftToRight, 0, 1),
   new CharacterNgramFeatureFunction(leftToRight, 0, 2),
   new CharacterNgramFeatureFunction(leftToRight, 0, 3),
   new CharacterNgramFeatureFunction(rightToLeft, 0, 1),
   new CharacterNgramFeatureFunction(rightToLeft, 0, 2),
   new CharacterNgramFeatureFunction(rightToLeft, 0, 3),
   new CharacterNgramFeatureFunction(rightToLeft, 0, 4),
   new CharacterNgramFeatureFunction(rightToLeft, 0, 5),
   new CharacterNgramFeatureFunction(rightToLeft, 0, 6));
 simpleExtractors = Lists.newArrayList();
 simpleExtractors.add(derived);

 // Plain window: 2 tokens on each side.
 CleartkExtractor<Token, Token> window = new CleartkExtractor<Token, Token>(
   Token.class,
   tokenText,
   new Preceding(2),
   new Following(2));
 windowExtractors = Lists.newArrayList();
 windowExtractors.add(window);

 // N-gram window: the same spans, each combined through Ngram.
 CleartkExtractor<Token, Token> ngramWindow = new CleartkExtractor<Token, Token>(
   Token.class,
   tokenText,
   new Ngram(new Preceding(2)),
   new Ngram(new Following(2)));
 windowNGramExtractors = Lists.newArrayList();
 windowNGramExtractors.add(ngramWindow);
}

/**
 * Creates the annotator and wires up its feature extractors.
 *
 * <p>Source and target anchors receive the same four features (covered text, "pos", "stem",
 * and the {@code TokenTextForSelectedPosExtractor} output over the 3 preceding tokens), named
 * with the prefix "Source" or "Target". The pos, stem and preceding-token extractor instances
 * are shared between the two lists. A "WordsBetween" extractor bags the covered text of the
 * tokens covered by the annotation it is given, and a {@code TargetPathExtractor} is installed
 * as the path extractor. {@code eventID} starts at 1.
 */
public VerbClauseTemporalAnnotator() {
 this.eventID = 1;

 // Extractors shared by the source and target feature lists.
 FeatureExtractor1<Token> auxiliariesBefore = new CleartkExtractor<Token, Token>(
   Token.class,
   new TokenTextForSelectedPosExtractor("MD", "TO", "IN", "VB", "RB"),
   new Preceding(3));
 FeatureExtractor1<Token> stem = new TypePathExtractor<Token>(Token.class, "stem");
 FeatureExtractor1<Token> pos = new TypePathExtractor<Token>(Token.class, "pos");

 // Source anchor features: text, pos, stem, preceding auxiliaries.
 this.sourceFeatureExtractors = Lists.newArrayList();
 this.sourceFeatureExtractors.add(
   new NamingExtractor1<Token>("Source", new CoveredTextExtractor<Token>()));
 this.sourceFeatureExtractors.add(new NamingExtractor1<Token>("Source", pos));
 this.sourceFeatureExtractors.add(new NamingExtractor1<Token>("Source", stem));
 this.sourceFeatureExtractors.add(new NamingExtractor1<Token>("Source", auxiliariesBefore));

 // Target anchor features: same set, different name prefix.
 this.targetFeatureExtractors = Lists.newArrayList();
 this.targetFeatureExtractors.add(
   new NamingExtractor1<Token>("Target", new CoveredTextExtractor<Token>()));
 this.targetFeatureExtractors.add(new NamingExtractor1<Token>("Target", pos));
 this.targetFeatureExtractors.add(new NamingExtractor1<Token>("Target", stem));
 this.targetFeatureExtractors.add(new NamingExtractor1<Token>("Target", auxiliariesBefore));

 // Bag of token texts covered by the annotation handed to this extractor.
 CleartkExtractor<Annotation, Token> coveredWords = new CleartkExtractor<Annotation, Token>(
   Token.class,
   new CoveredTextExtractor<Token>(),
   new Bag(new Covered()));
 this.betweenAnchorsFeatureExtractors = new ArrayList<FeatureExtractor1<Annotation>>();
 this.betweenAnchorsFeatureExtractors.add(
   new NamingExtractor1<Annotation>("WordsBetween", coveredWords));

 this.pathExtractor = new TargetPathExtractor();
}

/**
 * Sets up the token extractor, the context extractor and the chunking definition.
 *
 * @param context the UIMA context, forwarded to {@code super.initialize}
 * @throws ResourceInitializationException if initialization fails
 */
@Override
public void initialize(UimaContext context) throws ResourceInitializationException {
 super.initialize(context);

 // Token features: covered text with a character-category pattern (repeats merged), plus the
 // "pos" type path.
 FeatureFunctionExtractor<Token> textAndPattern = new FeatureFunctionExtractor<Token>(
   new CoveredTextExtractor<Token>(),
   new CharacterCategoryPatternFunction<Token>(PatternType.REPEATS_MERGED));
 TypePathExtractor<Token> pos = new TypePathExtractor<Token>(Token.class, "pos");
 this.extractor = new CombinedExtractor1<Token>(textAndPattern, pos);

 // Context features: the token features above, applied to the 3 preceding and 3 following
 // tokens.
 Preceding before = new Preceding(3);
 Following after = new Following(3);
 this.contextExtractor =
   new CleartkExtractor<Token, Token>(Token.class, this.extractor, before, after);

 // Chunking: Tokens are combined into NamedEntityMentions, with labels taken from the
 // "mentionType" attribute (e.g. B-location, I-person).
 this.chunking = new BioChunking<Token, NamedEntityMention>(
   Token.class,
   NamedEntityMention.class,
   "mentionType");
}

/**
 * Creates the token feature extractor and the surrounding-context feature extractor.
 *
 * @param context the UIMA context, forwarded to {@code super.initialize}
 * @throws ResourceInitializationException if initialization fails
 */
public void initialize(UimaContext context) throws ResourceInitializationException {
 super.initialize(context);

 // Token features: the word itself, its lower-cased form, its capitalization type, its numeric
 // type, and right-to-left character n-grams with end index 2 and 3.
 CoveredTextExtractor<Token> word = new CoveredTextExtractor<Token>();
 this.tokenFeatureExtractor = new FeatureFunctionExtractor<Token>(
   word,
   new LowerCaseFeatureFunction(),
   new CapitalTypeFeatureFunction(),
   new NumericTypeFeatureFunction(),
   new CharacterNgramFeatureFunction(Orientation.RIGHT_TO_LEFT, 0, 2),
   new CharacterNgramFeatureFunction(Orientation.RIGHT_TO_LEFT, 0, 3));

 // Context features: text of the 2 preceding and 2 following tokens. A separate text extractor
 // instance is used here, as in the token extractor above.
 CoveredTextExtractor<Token> neighborWord = new CoveredTextExtractor<Token>();
 Preceding before = new Preceding(2);
 Following after = new Following(2);
 this.contextFeatureExtractor =
   new CleartkExtractor<Token, Token>(Token.class, neighborWord, before, after);
}

 /**
  * Creates the extractor, optionally backed by a vector file.
  *
  * <p>When {@code vectorFile} is {@code null} nothing is set up. Otherwise a
  * {@code ContinuousTextExtractor} is created from the file and applied to four token contexts:
  * the first covered token, the last covered token, the 1 preceding token and the 1 following
  * token.
  *
  * @param vectorFile location passed to {@code ContinuousTextExtractor}; may be {@code null}
  * @throws CleartkExtractorException declared by the signature
  */
 public MentionClusterMentionFeaturesExtractor(String vectorFile) throws CleartkExtractorException {
  // No vector file: leave the vector-based extractors unset.
  if (vectorFile == null) {
   return;
  }

  this.continuousText = new ContinuousTextExtractor(vectorFile);
  this.tokenVectorContext = new CleartkExtractor<>(
    BaseToken.class,
    this.continuousText,
    new FirstCovered(1),
    new LastCovered(1),
//          new Bag(new Covered()),
    new Preceding(1),
    new Following(1));
 }

 public MentionClusterMentionFeaturesExtractor(String vectorFile) throws CleartkExtractorException {
  if(vectorFile != null){
   this.continuousText = new ContinuousTextExtractor(vectorFile);
   this.tokenVectorContext = new CleartkExtractor<>(
     BaseToken.class,
     continuousText,
     new FirstCovered(1),
     new LastCovered(1),
//          new Bag(new Covered()),
     new Preceding(1),
     new Following(1));
  }
 }

/**
 * Adds one context extractor on top of whatever the superclass configured: a bag over the 3
 * tokens preceding the event, using {@code TokenTextForSelectedPosExtractor} with the tags
 * "RB", "MD", "TO" and "IN".
 *
 * @param context the UIMA context, forwarded to {@code super.initialize}
 * @throws ResourceInitializationException if initialization fails
 */
@Override
public void initialize(UimaContext context) throws ResourceInitializationException {
 super.initialize(context);

 TokenTextForSelectedPosExtractor selectedPosText =
   new TokenTextForSelectedPosExtractor("RB", "MD", "TO", "IN");
 Bag threeBefore = new Bag(new Preceding(3));
 CleartkExtractor<Event, Token> precedingBag =
   new CleartkExtractor<Event, Token>(Token.class, selectedPosText, threeBefore);
 this.contextExtractors.add(precedingBag);
}

/**
 * Adds one context extractor on top of whatever the superclass configured: a bag over the 3
 * tokens preceding the event, using {@code TokenTextForSelectedPosExtractor} with the tag "RB".
 *
 * @param context the UIMA context, forwarded to {@code super.initialize}
 * @throws ResourceInitializationException if initialization fails
 */
@Override
public void initialize(UimaContext context) throws ResourceInitializationException {
 super.initialize(context);

 TokenTextForSelectedPosExtractor adverbText = new TokenTextForSelectedPosExtractor("RB");
 Bag threeBefore = new Bag(new Preceding(3));
 CleartkExtractor<Event, Token> precedingBag =
   new CleartkExtractor<Event, Token>(Token.class, adverbText, threeBefore);
 this.contextExtractors.add(precedingBag);
}

/**
 * Extends the superclass configuration with two event features and one context feature.
 *
 * <p>Event features: a {@code TextSliceExtractor} constructed with -2 (presumably a trailing
 * slice of the event text; confirm against that class), and a bag of the "pos" values of the
 * tokens covered by the event. Context feature: {@code TokenTextForSelectedPosExtractor} with
 * tags "MD", "TO", "IN" and "VB" over the 3 preceding tokens (not bagged).
 *
 * @param context the UIMA context, forwarded to {@code super.initialize}
 * @throws ResourceInitializationException if initialization fails
 */
@Override
public void initialize(UimaContext context) throws ResourceInitializationException {
 super.initialize(context);

 // Event-level features.
 TextSliceExtractor<Event> textSlice = new TextSliceExtractor<Event>(-2);
 this.eventFeatureExtractors.add(textSlice);

 TypePathExtractor<Token> pos = new TypePathExtractor<Token>(Token.class, "pos");
 Bag coveredBag = new Bag(new Covered());
 CleartkExtractor<Event, Token> coveredPos =
   new CleartkExtractor<Event, Token>(Token.class, pos, coveredBag);
 this.eventFeatureExtractors.add(coveredPos);

 // Context feature over the 3 tokens before the event.
 TokenTextForSelectedPosExtractor selectedPosText =
   new TokenTextForSelectedPosExtractor("MD", "TO", "IN", "VB");
 CleartkExtractor<Event, Token> precedingText =
   new CleartkExtractor<Event, Token>(Token.class, selectedPosText, new Preceding(3));
 this.contextExtractors.add(precedingText);
}

/**
 * Extends the superclass configuration with one event feature and one context feature.
 *
 * <p>Event feature: a bag of the "pos" values of the tokens covered by the event. Context
 * feature: a bag over the 3 preceding tokens using {@code TokenTextForSelectedPosExtractor}
 * with the tag "VB".
 *
 * @param context the UIMA context, forwarded to {@code super.initialize}
 * @throws ResourceInitializationException if initialization fails
 */
@Override
public void initialize(UimaContext context) throws ResourceInitializationException {
 super.initialize(context);

 // Event-level feature: POS tags of the covered tokens, as a bag.
 TypePathExtractor<Token> pos = new TypePathExtractor<Token>(Token.class, "pos");
 Bag coveredBag = new Bag(new Covered());
 CleartkExtractor<Event, Token> coveredPos =
   new CleartkExtractor<Event, Token>(Token.class, pos, coveredBag);
 this.eventFeatureExtractors.add(coveredPos);

 // Context feature: selected-POS token text from the 3 tokens before the event, as a bag.
 TokenTextForSelectedPosExtractor verbText = new TokenTextForSelectedPosExtractor("VB");
 Bag threeBefore = new Bag(new Preceding(3));
 CleartkExtractor<Event, Token> precedingBag =
   new CleartkExtractor<Event, Token>(Token.class, verbText, threeBefore);
 this.contextExtractors.add(precedingBag);
}

Javadoc

Constructs a context that will extract features over the preceding N annotations.

Popular methods of CleartkExtractor$Preceding

extract

Popular in Java

Finding current android device location
scheduleAtFixedRate (Timer)
findViewById (Activity)
setContentView (Activity)
ByteBuffer (java.nio)
A buffer for bytes. A byte buffer can be created in either one of the following ways: * #allocate
Date (java.sql)
A class which can consume and produce dates in SQL Date format. Dates are represented in SQL as yyyy
BitSet (java.util)
The BitSet class implements a bit array [http://en.wikipedia.org/wiki/Bit_array]. Each element is eit
TreeSet (java.util)
TreeSet is an implementation of SortedSet. All optional operations (adding and removing) are support
ReentrantLock (java.util.concurrent.locks)
A reentrant mutual exclusion Lock with the same basic behavior and semantics as the implicit monitor
VirtualMachine (com.sun.tools.attach)
A Java virtual machine. A VirtualMachine represents a Java virtual machine to which this Java vir
Top Vim plugins

How to use org.cleartk.ml.feature.extractor.CleartkExtractor$Preceding constructor

Best Java code snippets using org.cleartk.ml.feature.extractor.CleartkExtractor$Preceding.<init> (Showing top 20 results out of 315)

How to use
org.cleartk.ml.feature.extractor.CleartkExtractor$Preceding
constructor