/**
 * Creates an {@link Occurrence} for the span from the first to the last
 * {@link Token}, using the parsed sentence as context — or, when the sentence
 * exceeds {@code MAX_CONTEXT_LENGTH}, a window cut around the tokens.
 * @param sentence the sentence (section) the occurrence was found in
 * @param start the first token of the occurrence
 * @param end the last token of the occurrence
 */
private Occurrence(Section sentence,Token start,Token end){
    this.start = start.getStart();
    this.end = end.getEnd();
    //by default the whole sentence is used as context
    String context = sentence.getSpan();
    if(context.length() > MAX_CONTEXT_LENGTH){
        //NOTE(review): CONTEXT_TOKEN_COUNT is added to/subtracted from
        //character offsets (this.start / this.end are char indexes), so
        //despite its name the window is measured in characters — confirm
        //the intended unit.
        //NOTE(review): this.start/this.end are offsets in the whole analysed
        //text, but substring(..) is called on the span returned by
        //start.getContext().getSpan(). That is only correct if the context
        //span starts at offset 0 of the text — verify against Token/Section.
        context = start.getContext().getSpan().substring(
            Math.max(0, this.start-CONTEXT_TOKEN_COUNT),
            //NOTE(review): the trailing "-1" is applied to the whole min(..),
            //so it also drops the last character when end+CONTEXT_TOKEN_COUNT
            //is the limiting value — looks like an off-by-one; confirm.
            Math.min(this.end+CONTEXT_TOKEN_COUNT, start.getContext().getEnd())-1);
    }
    this.context = context;
} /**
/**
 * Creates an {@link Occurrence} for the span from the first to the last
 * {@link Token}, using the parsed sentence as context — or, when the sentence
 * exceeds {@code MAX_CONTEXT_LENGTH}, a window cut around the tokens.
 * @param sentence the sentence (section) the occurrence was found in
 * @param start the first token of the occurrence
 * @param end the last token of the occurrence
 */
private Occurrence(Section sentence,Token start,Token end){
    this.start = start.getStart();
    this.end = end.getEnd();
    //by default the whole sentence is used as context
    String context = sentence.getSpan();
    if(context.length() > MAX_CONTEXT_LENGTH){
        //NOTE(review): CONTEXT_TOKEN_COUNT is added to/subtracted from
        //character offsets (this.start / this.end are char indexes), so
        //despite its name the window is measured in characters — confirm
        //the intended unit.
        //NOTE(review): this.start/this.end are offsets in the whole analysed
        //text, but substring(..) is called on the span returned by
        //start.getContext().getSpan(). That is only correct if the context
        //span starts at offset 0 of the text — verify against Token/Section.
        context = start.getContext().getSpan().substring(
            Math.max(0, this.start-CONTEXT_TOKEN_COUNT),
            //NOTE(review): the trailing "-1" is applied to the whole min(..),
            //so it also drops the last character when end+CONTEXT_TOKEN_COUNT
            //is the limiting value — looks like an off-by-one; confirm.
            Math.min(this.end+CONTEXT_TOKEN_COUNT, start.getContext().getEnd())-1);
    }
    this.context = context;
} /**
/**
 * Runs OpenNLP sentence detection over the text of the parsed
 * {@link AnalysedText} and registers every detected sentence with it.
 * @param at the analysed text to segment into sentences
 * @param language the language used to look up a sentence detector
 * @return the sentences added to {@code at}, or {@code null} when no
 * sentence detector is available for the given language (note: {@code null},
 * not an empty list — callers distinguish "no detector" from "no sentences")
 */
private List<Section> detectSentences(AnalysedText at, String language) {
    SentenceDetector detector = getSentenceDetector(language);
    if(detector == null){
        //no detector for this language -> signal with null
        return null;
    }
    List<Section> detected = new ArrayList<Section>();
    for(opennlp.tools.util.Span span : detector.sentPosDetect(at.getSpan())){
        Sentence sent = at.addSentence(span.getStart(), span.getEnd());
        log.trace(" > add {}",sent);
        detected.add(sent);
    }
    return detected;
}
contextElements.add(sentence); String context = at.getSpan().substring( sentences.get(Math.max(0, i-1)).getStart(), sentences.get(Math.min(sentences.size()-1, i+1)).getEnd()); String name = at.getSpan().substring(tokens.get(nameSpans[j].getStart()).getStart(), tokens.get(nameSpans[j].getEnd()-1).getEnd()); Double confidence = 1.0;
if(log.isDebugEnabled()){ log.debug("computeEnhancements for ContentItem {} language {} text={}", new Object []{ci.getUri().getUnicodeString(), language, StringUtils.abbreviate(at.getSpan(), 100)});
new Object []{ci.getUri().getUnicodeString(), language, StringUtils.abbreviate(at.getSpan(), 100)});
if(log.isDebugEnabled()){ log.debug("computeEnhancements for ContentItem {} language {} text={}", new Object []{ci.getUri().getUnicodeString(), language, StringUtils.abbreviate(at.getSpan(), 100)});
SentenceDetector sentenceDetector = getSentenceDetector(language); if(sentenceDetector != null){ for(opennlp.tools.util.Span sentSpan : sentenceDetector.sentPosDetect(at.getSpan())) {
if(log.isDebugEnabled()){ log.debug("computeEnhancements from AnalysedText ContentPart of ContentItem {}: text={}", ci.getUri().getUnicodeString(), StringUtils.abbreviate(at.getSpan(), 100));
content = at.getSpan(); } else { //no analyzed text ... read is from the text/plain blob try {
log.debug("findNamedEntities model={}, language={}, text=", new Object[]{ nameFinderModel, language, StringUtils.abbreviate(at != null ? at.getSpan() : text, 100) });
List<LexicalEntry> terms; try { terms = this.client.performMorfologicalAnalysis(at.getSpan(), language); } catch (IOException e) { throw new EngineException("Error while calling the CELI Lemmatizer"
String phraseText = at.getSpan().substring(sentPhrase.getStartIndex(), sentPhrase.getEndIndex()); metadata.add(new TripleImpl(enh, ENHANCER_SELECTED_TEXT, new PlainLiteralImpl(phraseText, lang))); metadata.add(new TripleImpl(enh, ENHANCER_SELECTION_CONTEXT, new PlainLiteralImpl(getSelectionContext( at.getSpan(), phraseText, sentPhrase.getStartIndex()),lang))); } else { metadata.add(new TripleImpl(enh, ENHANCER_SELECTION_CONTEXT,
nerList.get(nerSentIndex).context = lastSent.getSpan(); } else { //no sentence detected nerList.get(nerSentIndex).context = at.getSpan(); IRI ta = EnhancementEngineHelper.createTextEnhancement(ci, this); metadata.add(new TripleImpl(ta, ENHANCER_SELECTED_TEXT, new PlainLiteralImpl( at.getSpan().substring(nerData.start, nerData.end),lang))); metadata.add(new TripleImpl(ta, DC_TYPE, nerData.tag.getType())); metadata.add(new TripleImpl(ta, ENHANCER_START, lf.createTypedLiteral(nerData.start)));
metadata.add(new TripleImpl(ta, ENHANCER_SELECTION_CONTEXT, new PlainLiteralImpl(context == null ? getDefaultSelectionContext(at.getSpan(), span.getSpan(), span.getStart()) : context.getSpan(), lang)));
graph.add(new TripleImpl(segment, Nif20.endIndex.getUri(), lf.createTypedLiteral(span.getEnd()))); String content = text.getSpan(); if(span.getType() != SpanTypeEnum.Text){