@Override protected void map(Writable key, BytesWritable value, Context context) throws IOException, InterruptedException { Configuration conf = context.getConfiguration(); String extractionOption = conf.get(EXTRACTION_OPTION); String lang = conf.get(EXTRACTION_LANGUAGE); DocumentWrapper docWrapper = DocumentProtos.DocumentWrapper.parseFrom(value.copyBytes()); RakeExtractor rakeExtractor = new RakeExtractor(docWrapper, extractionOption, lang); List<String> keywords = rakeExtractor.getKeywords(); if (keywords.size() > 0) { String docId = docWrapper.getDocumentMetadata().getKey(); DocumentProtos.KeywordsList.Builder kwdBuilder = DocumentProtos.KeywordsList.newBuilder(); DocumentProtos.ProvenanceInfo.Builder provenanceBuilder = DocumentProtos.ProvenanceInfo.newBuilder(); DocumentProtos.ProvenanceInfo.SingleProvenanceInfo.Builder singleProvenanceBuilder = DocumentProtos.ProvenanceInfo.SingleProvenanceInfo.newBuilder(); singleProvenanceBuilder.setLastModificationDate(new Date().getTime()); singleProvenanceBuilder.setLastModificationMarkerId(ALGORITHM_NAME); provenanceBuilder.setCurrentProvenance(singleProvenanceBuilder); kwdBuilder.setProvenance(provenanceBuilder); kwdBuilder.addAllKeywords(keywords); context.write(new Text(docId), new BytesWritable(kwdBuilder.build().toByteArray())); } } }
private ProvenanceInfo.Builder createProvenance() { ProvenanceInfo.Builder pb = ProvenanceInfo.newBuilder(); ProvenanceInfo.SingleProvenanceInfo.Builder spb = ProvenanceInfo.SingleProvenanceInfo.newBuilder(); spb.setLastModificationMarkerId(CoansysModulesConstants.COANSYS_MODULE_ID_DISAMBIGUATION_AUTHOR); spb.setLastModificationDate(new Date().getTime()); pb.setCurrentProvenance(spb); return pb; }
nlmMediaBuilder.setMediaType(ProtoConstants.mediaTypeNlm); DocumentProtos.ProvenanceInfo.Builder provenanceBuilder = DocumentProtos.ProvenanceInfo.newBuilder(); DocumentProtos.ProvenanceInfo.SingleProvenanceInfo.Builder signleProvenance = DocumentProtos.ProvenanceInfo.SingleProvenanceInfo.newBuilder();
ProvenanceInfo.Builder provenanceBuilder = ProvenanceInfo.newBuilder(); ProvenanceInfo.SingleProvenanceInfo.Builder singleProvenanceBuilder = ProvenanceInfo.SingleProvenanceInfo.newBuilder(); singleProvenanceBuilder
.newBuilder(); ProvenanceInfo.SingleProvenanceInfo.Builder singleProvenanceBuilder = ProvenanceInfo.SingleProvenanceInfo .newBuilder();