/**
 * Checks the {@link #start} and {@link #end} values against the span covered
 * by the parsed token and widens them if necessary.<p>
 * This method is called by all methods that add tokens.
 * @param token the added token
 */
private void checkSpan(Token token) {
    if(start > token.getStart()){
        start = token.getStart();
    }
    if(end < token.getEnd()){
        end = token.getEnd();
    }
}
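// For illustration, a minimal self-contained sketch of the same span-widening
// pattern using plain int offsets. SpanTracker and its members are hypothetical
// names invented for this sketch, not part of the actual API.
class SpanTracker {
    private int start = Integer.MAX_VALUE;
    private int end = Integer.MIN_VALUE;

    /** Widens the tracked span so it encloses [tokenStart, tokenEnd). */
    void add(int tokenStart, int tokenEnd) {
        if (start > tokenStart) { start = tokenStart; }
        if (end < tokenEnd) { end = tokenEnd; }
    }

    public static void main(String[] args) {
        SpanTracker t = new SpanTracker();
        t.add(10, 14); // span is now [10,14)
        t.add(4, 8);   // widened to [4,14)
        t.add(12, 20); // widened to [4,20)
        System.out.println(t.start + ".." + t.end); // prints "4..20"
    }
}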
@Override
public Chunk createChunk(Token start, Token end) {
    if(start == null || end == null){
        throw new IllegalArgumentException("Parsed start Token '" + start
            + "' and end Token '" + end + "' MUST NOT be NULL!");
    }
    lock.writeLock().lock();
    try {
        return at.addChunk(start.getStart(), end.getEnd());
    } finally {
        lock.writeLock().unlock();
    }
}
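// createChunk uses the standard lock-in-try/finally idiom of
// java.util.concurrent.locks.ReadWriteLock. Below is a self-contained sketch of
// that pattern; ChunkStore and its int[]-based chunks are illustrative
// stand-ins, not the actual AnalysedText internals.
import java.util.ArrayList;
import java.util.List;
import java.util.concurrent.locks.ReadWriteLock;
import java.util.concurrent.locks.ReentrantReadWriteLock;

class ChunkStore {
    private final ReadWriteLock lock = new ReentrantReadWriteLock();
    private final List<int[]> chunks = new ArrayList<>();

    int[] addChunk(int start, int end) {
        lock.writeLock().lock(); //exclusive access while mutating
        try {
            int[] chunk = new int[]{start, end};
            chunks.add(chunk);
            return chunk;
        } finally {
            lock.writeLock().unlock(); //always released, even on exception
        }
    }

    int size() {
        lock.readLock().lock(); //shared access is enough for readers
        try {
            return chunks.size();
        } finally {
            lock.readLock().unlock();
        }
    }
}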
/**
 * Every time the entityLinker starts to process a token we need to check
 * if we need to add additional contextual information from the {@link ContentItem}
 * to the {@link InMemoryEntityIndex}.
 */
@Override
public void startToken(Token token) {
    log.debug(" > start token: {}", token);
    final Integer actIndex = token.getStart();
    if(actIndex > lastIndex){
        //add all mentions starting in [lastIndex, actIndex) to the index
        for(Collection<EntityMention> mentions : mentionIndex.subMap(lastIndex, actIndex).values()){
            for(EntityMention mention : mentions){
                addEntity(mention);
            }
        }
        lastIndex = actIndex;
    } else if(lastIndex > actIndex){
        log.warn("Token {} has an earlier start index than the last one {}!",
            token, lastIndex);
    } // else the same index ... ignore
}
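// The subMap(..) call is the interesting part: mentions are indexed by start
// offset in a sorted map, so all mentions between the last processed offset
// (inclusive) and the current one (exclusive) can be drained via a single
// range view. A minimal sketch, assuming mentions reduced to plain Strings;
// MentionIndexSketch and its members are hypothetical.
import java.util.ArrayList;
import java.util.Collection;
import java.util.List;
import java.util.TreeMap;

class MentionIndexSketch {
    private final TreeMap<Integer, Collection<String>> mentionIndex = new TreeMap<>();
    private int lastIndex = 0;

    void index(int startOffset, String mention) {
        mentionIndex.computeIfAbsent(startOffset, k -> new ArrayList<>()).add(mention);
    }

    /** Returns every mention starting in [lastIndex, actIndex). */
    List<String> startToken(int actIndex) {
        List<String> added = new ArrayList<>();
        if (actIndex > lastIndex) {
            for (Collection<String> mentions : mentionIndex.subMap(lastIndex, actIndex).values()) {
                added.addAll(mentions);
            }
            lastIndex = actIndex;
        }
        return added;
    }
}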
/**
 * Creates a new Linked Entity including the first {@link Occurrence}.
 * @param section the sentence (context) for the occurrence.
 * @param startToken the first token of the span
 * @param endToken the last token of the span
 * @param suggestions the entity suggestions
 * @param types the types of the linked entity.
 */
protected LinkedEntity(Section section, Token startToken, Token endToken,
        List<Suggestion> suggestions, Set<IRI> types) {
    this(startToken.getSpan().substring(startToken.getStart(), endToken.getEnd()),
        suggestions, types);
    addOccurrence(section, startToken, endToken);
}
/**
 * Getter for the text covered by <code>tokenCount</code> tokens starting at
 * the token with index <code>start</code>.
 * Given the tokens
 * <pre>
 *     [This, is, an, Example]
 * </pre>
 * the parameters <code>start=0</code> and <code>tokenCount=3</code> will return
 * <pre>
 *     This is an
 * </pre>
 * @param start the index of the first token to be included
 * @param tokenCount the number of tokens to be included
 * @return the text covered by the span from the start of the token at index
 * <code>start</code> to the end of the token at index
 * <code>start + tokenCount - 1</code>.
 */
public String getTokenText(int start, int tokenCount){
    int offset = section.getStart(); //token offsets are absolute, the section span is not
    return section.getSpan().substring(
        tokens.get(start).token.getStart() - offset,
        tokens.get(start + (tokenCount - 1)).token.getEnd() - offset);
}
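// A minimal, runnable sketch of the same offset arithmetic, using int arrays
// instead of the actual Section/Token types (all names and offsets here are
// illustrative assumptions):
class TokenTextSketch {
    public static void main(String[] args) {
        String document = "Intro. This is an Example.";
        int sectionStart = 7; //the section "This is an Example." starts here
        String sectionSpan = document.substring(sectionStart);
        //absolute [start,end) character offsets of the four tokens
        int[][] tokens = {{7, 11}, {12, 14}, {15, 17}, {18, 25}};

        int start = 0, tokenCount = 3;
        //token offsets are absolute, so subtract the section start
        String text = sectionSpan.substring(
            tokens[start][0] - sectionStart,
            tokens[start + tokenCount - 1][1] - sectionStart);
        System.out.println(text); // prints "This is an"
    }
}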
private Occurrence(Section sentence, Token start, Token end){
    this.start = start.getStart();
    this.end = end.getEnd();
    String context = sentence.getSpan();
    if(context.length() > MAX_CONTEXT_LENGTH){
        //sentence too long: fall back to a window around the occurrence
        context = start.getContext().getSpan().substring(
            Math.max(0, this.start - CONTEXT_TOKEN_COUNT),
            Math.min(this.end + CONTEXT_TOKEN_COUNT,
                start.getContext().getEnd()) - 1);
    }
    this.context = context;
}
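// The constructor caps overlong sentence contexts by falling back to a window
// around the occurrence. A sketch of that truncation pattern with plain
// Strings; ContextWindowSketch, CONTEXT_PAD and the constant values are
// assumptions made for this sketch.
class ContextWindowSketch {
    static final int MAX_CONTEXT_LENGTH = 20;
    static final int CONTEXT_PAD = 5; //plays the role of CONTEXT_TOKEN_COUNT

    static String context(String fullText, int start, int end) {
        String context = fullText;
        if (context.length() > MAX_CONTEXT_LENGTH) {
            context = fullText.substring(
                Math.max(0, start - CONTEXT_PAD),               //never before the text
                Math.min(end + CONTEXT_PAD, fullText.length())); //never past its end
        }
        return context;
    }

    public static void main(String[] args) {
        String text = "The quick brown fox jumps over the lazy dog";
        System.out.println(context(text, 16, 19)); // prints "rown fox jump"
    }
}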
if(cursorToken.token.getStart() < endOffset){
phraseType.getPhraseType().name(), current.get(0).getStart(), current.get(current.size()-1).getEnd()});
//nameSpans address token indices; map them back to character offsets
String name = at.getSpan().substring(
    tokens.get(nameSpans[j].getStart()).getStart(),
    tokens.get(nameSpans[j].getEnd() - 1).getEnd());
Double confidence = 1.0;
confidence *= probs[k];
int start = tokens.get(nameSpans[j].getStart()).getStart();
int end = start + name.length();
NerTag nerTag = config.getNerTag(nameSpans[j].getType());
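// OpenNLP name spans address token indices, not characters: getStart()/getEnd()
// select tokens, which must be mapped back to character offsets to extract the
// surface form. A sketch of that conversion; the text and token offsets are
// hard-coded assumptions, only opennlp.tools.util.Span is the real API.
import opennlp.tools.util.Span;

class NameSpanSketch {
    public static void main(String[] args) {
        String text = "Barack Obama visited Berlin";
        //absolute [start,end) character offsets of the four tokens
        int[][] tokenOffsets = {{0, 6}, {7, 12}, {13, 20}, {21, 27}};
        Span nameSpan = new Span(0, 2, "person"); //tokens 0..1 -> "Barack Obama"

        int start = tokenOffsets[nameSpan.getStart()][0];
        int end = tokenOffsets[nameSpan.getEnd() - 1][1];
        String name = text.substring(start, end);
        System.out.println(name + " [" + nameSpan.getType() + "]"); // Barack Obama [person]
    }
}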
linkableTokenContext = linkableTokens.isEmpty() ? null : linkableTokens.get(0);
if(linkableTokenContext == null
        || linkableTokenContext.linkableToken.token.getStart() >= end){
    // ...
}
// ...
//clip the matched span to the borders of the linkable token
int[] mSpan = new int[]{
    Math.max(start, linkableToken.token.getStart()),
    Math.min(end, linkableToken.token.getEnd())};
if(mSpan[0] > start){
    //search backwards for tokens before the match
    for(int i = linkableToken.index - 1; i >= 0; i--){
        TokenData token = tokens.get(i);
        int tStart = token.token.getStart();
        if(tStart < start){
            break;
        }
        // ...
    }
}
// ...
if(td.isMatchable){
    num++;
    if(match < 1 && td.token.getStart() >= start
            || match > 0 && td.token.getEnd() <= end){
        match++;
    }
}
while((token = nextToken(first)) != null){
    log.trace(" < [{},{}]:{} (link {}, match: {})", new Object[]{
        token.token.getStart(), token.token.getEnd(), token.getTokenText(),
        token.isLinkable, token.isMatchable});
    first = false;
    // ...
}
// ...
log.trace("lookup: token [{},{}]: {} | word [{},{}]:{}", new Object[]{
    offset.startOffset(), offset.endOffset(), termAtt,
    t.token.getStart(), t.token.getEnd(), t.getTokenText()});
activeChunk.matchableStartCharIndex = tokenData.token.getStart();
this.value = value;
this.sentence = sentence;
this.start = token.getStart();
this.end = token.getEnd();
List<Value<PosTag>> tags = token.getAnnotations(NlpAnnotations.POS_ANNOTATION);
upperCase = token.getEnd() > token.getStart() //not an empty token
    && Character.isUpperCase(token.getSpan().codePointAt(0)); //and upper case
boolean isLinkablePos = false;
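// Using codePointAt(0) instead of charAt(0) keeps the check correct for
// letters outside the Basic Multilingual Plane. A small sketch of the same
// test (UpperCaseSketch is a hypothetical name):
class UpperCaseSketch {
    static boolean startsUpperCase(String span) {
        return !span.isEmpty() && Character.isUpperCase(span.codePointAt(0));
    }

    public static void main(String[] args) {
        System.out.println(startsUpperCase("Berlin"));     // true
        System.out.println(startsUpperCase("berlin"));     // false
        System.out.println(startsUpperCase("Österreich")); // true, non-ASCII upper case
    }
}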