/**
 * Marks the processing document as a tombstone document rather than a regular document.
 * Tombstone documents are stored in the Lucene index to represent delete operations or no-ops.
 */
ParsedDocument toTombstone() {
    assert docs().size() == 1 : "Tombstone should have a single doc [" + docs() + "]";
    this.seqID.tombstoneField.setLongValue(1);
    rootDoc().add(this.seqID.tombstoneField);
    return this;
}
public ParsedDocument createNoopTombstoneDoc(String index, String reason) throws MapperParsingException {
    final String id = ""; // _id won't be used.
    final SourceToParse sourceToParse =
        SourceToParse.source(index, type, id, new BytesArray("{}"), XContentType.JSON);
    final ParsedDocument parsedDoc =
        documentParser.parseDocument(sourceToParse, noopTombstoneMetadataFieldMappers).toTombstone();
    // Store the reason of a noop as a raw string in the _source field
    final BytesRef byteRef = new BytesRef(reason);
    parsedDoc.rootDoc().add(new StoredField(SourceFieldMapper.NAME, byteRef.bytes, byteRef.offset, byteRef.length));
    return parsedDoc;
}
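For orientation, a minimal plain-Lucene sketch of the same idea: flag a document as a tombstone with a doc-values field and keep the no-op reason in a stored field. The field names "_tombstone" and "_source" are placeholders chosen for illustration here, not the mapper constants used by the methods above.

import org.apache.lucene.document.Document;
import org.apache.lucene.document.NumericDocValuesField;
import org.apache.lucene.document.StoredField;
import org.apache.lucene.util.BytesRef;

// Hypothetical helper mirroring toTombstone()/createNoopTombstoneDoc();
// the field names are illustrative placeholders only.
static Document noopTombstone(String reason) {
    Document doc = new Document();
    // Flag the document as a tombstone (doc values only, neither indexed nor stored).
    doc.add(new NumericDocValuesField("_tombstone", 1L));
    // Keep the reason as a raw stored value so it can be read back later.
    BytesRef bytes = new BytesRef(reason);
    doc.add(new StoredField("_source", bytes.bytes, bytes.offset, bytes.length));
    return doc;
}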
private static Fields generateTermVectorsFromDoc(IndexShard indexShard, TermVectorsRequest request) throws IOException {
    // parse the document, at the moment we do update the mapping, just like percolate
    ParsedDocument parsedDocument = parseDocument(indexShard, indexShard.shardId().getIndexName(),
        request.type(), request.doc(), request.xContentType());
    // select the right fields and generate term vectors
    ParseContext.Document doc = parsedDocument.rootDoc();
    Set<String> seenFields = new HashSet<>();
    Collection<DocumentField> documentFields = new HashSet<>();
    for (IndexableField field : doc.getFields()) {
        MappedFieldType fieldType = indexShard.mapperService().fullName(field.name());
        if (!isValidField(fieldType)) {
            continue;
        }
        if (request.selectedFields() != null && !request.selectedFields().contains(field.name())) {
            continue;
        }
        if (seenFields.contains(field.name())) {
            continue;
        } else {
            seenFields.add(field.name());
        }
        String[] values = doc.getValues(field.name());
        documentFields.add(new DocumentField(field.name(), Arrays.asList((Object[]) values)));
    }
    return generateTermVectors(indexShard,
        XContentHelper.convertToMap(parsedDocument.source(), true, request.xContentType()).v2(),
        documentFields, request.offsets(), request.perFieldAnalyzer(), seenFields);
}
public void initialize(Engine.Searcher docSearcher, ParsedDocument parsedDocument) {
    this.docSearcher = docSearcher;
    IndexReader indexReader = docSearcher.reader();
    LeafReaderContext atomicReaderContext = indexReader.leaves().get(0);
    LeafSearchLookup leafLookup = lookup().getLeafSearchLookup(atomicReaderContext);
    leafLookup.setDocument(0);
    leafLookup.source().setSource(parsedDocument.source());

    Map<String, SearchHitField> fields = new HashMap<>();
    for (IndexableField field : parsedDocument.rootDoc().getFields()) {
        fields.put(field.name(), new InternalSearchHitField(field.name(), Collections.emptyList()));
    }

    hitContext().reset(
        new InternalSearchHit(0, "unknown", new Text(parsedDocument.type()), fields),
        atomicReaderContext, 0, docSearcher.searcher()
    );
}
    docSearcher = createMultiDocumentSearcher(analyzer, docs);
} else {
    MemoryIndex memoryIndex = MemoryIndex.fromDocument(docs.get(0).rootDoc(), analyzer, true, false);
    docSearcher = memoryIndex.createSearcher();
    docSearcher.setQueryCache(null);
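For the single-document branch above, a self-contained sketch of Lucene's MemoryIndex may help: it analyzes one document entirely in memory and exposes it through a regular IndexSearcher. The class name and sample field below are made up for illustration.

import java.io.IOException;
import org.apache.lucene.analysis.standard.StandardAnalyzer;
import org.apache.lucene.index.Term;
import org.apache.lucene.index.memory.MemoryIndex;
import org.apache.lucene.search.IndexSearcher;
import org.apache.lucene.search.TermQuery;

// Standalone sketch of the single-document MemoryIndex path used above.
public class MemoryIndexSketch {
    public static void main(String[] args) throws IOException {
        MemoryIndex memoryIndex = new MemoryIndex();
        // Analyze and index one field of one document entirely in memory.
        memoryIndex.addField("message", "the quick brown fox", new StandardAnalyzer());
        IndexSearcher searcher = memoryIndex.createSearcher();
        // Count matches for a term query against the in-memory document.
        int hits = searcher.count(new TermQuery(new Term("message", "fox")));
        System.out.println(hits); // prints 1
    }
}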
private Fields generateTermVectorsFromDoc(TermVectorsRequest request, boolean doAllFields) throws Throwable {
    // parse the document, at the moment we do update the mapping, just like percolate
    ParsedDocument parsedDocument = parseDocument(indexShard.shardId().getIndex(), request.type(), request.doc());
    // select the right fields and generate term vectors
    ParseContext.Document doc = parsedDocument.rootDoc();
    Set<String> seenFields = new HashSet<>();
    Collection<GetField> getFields = new HashSet<>();
    for (IndexableField field : doc.getFields()) {
        MappedFieldType fieldType = indexShard.mapperService().smartNameFieldType(field.name());
        if (!isValidField(fieldType)) {
            continue;
        }
        if (request.selectedFields() == null && !doAllFields && !fieldType.storeTermVectors()) {
            continue;
        }
        if (request.selectedFields() != null && !request.selectedFields().contains(field.name())) {
            continue;
        }
        if (seenFields.contains(field.name())) {
            continue;
        } else {
            seenFields.add(field.name());
        }
        String[] values = doc.getValues(field.name());
        getFields.add(new GetField(field.name(), Arrays.asList((Object[]) values)));
    }
    return generateTermVectors(getFields, request.offsets(), request.perFieldAnalyzer(), seenFields);
}
private static Fields generateTermVectorsFromDoc(IndexShard indexShard, TermVectorsRequest request) throws IOException {
    // parse the document, at the moment we do update the mapping, just like percolate
    ParsedDocument parsedDocument = parseDocument(indexShard, indexShard.shardId().getIndexName(),
        request.type(), request.doc(), request.xContentType());
    // select the right fields and generate term vectors
    ParseContext.Document doc = parsedDocument.rootDoc();
    Set<String> seenFields = new HashSet<>();
    Collection<GetField> getFields = new HashSet<>();
    for (IndexableField field : doc.getFields()) {
        MappedFieldType fieldType = indexShard.mapperService().fullName(field.name());
        if (!isValidField(fieldType)) {
            continue;
        }
        if (request.selectedFields() != null && !request.selectedFields().contains(field.name())) {
            continue;
        }
        if (seenFields.contains(field.name())) {
            continue;
        } else {
            seenFields.add(field.name());
        }
        String[] values = doc.getValues(field.name());
        getFields.add(new GetField(field.name(), Arrays.asList((Object[]) values)));
    }
    return generateTermVectors(indexShard,
        XContentHelper.convertToMap(parsedDocument.source(), true, request.xContentType()).v2(),
        getFields, request.offsets(), request.perFieldAnalyzer(), seenFields);
}
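The Fields object returned by these generateTermVectors* methods can be walked with the standard Lucene iteration pattern. A minimal sketch, assuming only the Lucene term-vector API (the helper name printTermVectors is hypothetical):

import java.io.IOException;
import org.apache.lucene.index.Fields;
import org.apache.lucene.index.Terms;
import org.apache.lucene.index.TermsEnum;
import org.apache.lucene.util.BytesRef;

// Walk a per-document term-vector Fields and print each term with its frequency.
static void printTermVectors(Fields fields) throws IOException {
    for (String fieldName : fields) {
        Terms terms = fields.terms(fieldName);
        if (terms == null) {
            continue;
        }
        TermsEnum termsEnum = terms.iterator();
        BytesRef term;
        while ((term = termsEnum.next()) != null) {
            // For a single-document term vector, totalTermFreq() is the term's frequency in that doc.
            System.out.println(fieldName + ":" + term.utf8ToString() + " freq=" + termsEnum.totalTermFreq());
        }
    }
}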
@Override
public void prepare(PercolateContext context, ParsedDocument parsedDocument) {
    MemoryIndex memoryIndex = cache.get();
    for (IndexableField field : parsedDocument.rootDoc().getFields()) {
        if (field.fieldType().indexOptions() == IndexOptions.NONE && field.name().equals(UidFieldMapper.NAME)) {
            continue;
        }
        try {
            Analyzer analyzer = context.mapperService().documentMapper(parsedDocument.type()).mappers().indexAnalyzer();
            // TODO: instead of passing null here, we can have a CTL<Map<String,TokenStream>> and pass previous,
            // like the indexer does
            try (TokenStream tokenStream = field.tokenStream(analyzer, null)) {
                if (tokenStream != null) {
                    memoryIndex.addField(field.name(), tokenStream, field.boost());
                }
            }
        } catch (Exception e) {
            throw new ElasticsearchException("Failed to create token stream for [" + field.name() + "]", e);
        }
    }
    context.initialize(new DocEngineSearcher(memoryIndex), parsedDocument);
}