private static DocumentWrapper buildFrom(DocumentDTO doc) { DocumentWrapper.Builder dw = DocumentWrapper.newBuilder(); String rowId = RowComposer.composeRow(doc); dw.setRowId(rowId);
MultiTypeParseResult mtpr=new MultiTypeParseResult(); if (documentMetadata!=null) { DocumentWrapper.Builder builder=DocumentWrapper.newBuilder(); builder.setDocumentMetadata(documentMetadata); if (mc!=null) {
DocumentWrapper.Builder dwb = DocumentWrapper.newBuilder(); dwb.setRowId(new String(row.getId())); if (dm != null) {
DocumentWrapper.Builder commonDocumentWrapper = DocumentWrapper.newBuilder(); commonDocumentWrapper.setDocumentMetadata(commonDocumentMetadata); commonDocumentWrapper.setRowId(doi);
.newBuilder(); documentWrapper.setDocumentMetadata(documentMetadata); documentWrapper.setRowId(doi);
public Tuple exec(Tuple input) throws IOException { if (input == null || input.size() != 3) { return null; } try{ String key = (String) input.get(0); DocumentWrapper dw = DocumentWrapper.parseFrom(((DataByteArray) input.get(1)).get()); String correctedDoi = (String) input.get(2); DocumentWrapper.Builder dwb = DocumentWrapper.newBuilder(dw); DocumentMetadata.Builder dmb = DocumentMetadata.newBuilder(dw.getDocumentMetadata()); BasicMetadata.Builder bmb = BasicMetadata.newBuilder(dmb.getBasicMetadata()); bmb.setDoi(correctedDoi); dmb.setBasicMetadata(bmb); dwb.setDocumentMetadata(dmb); Tuple ret = TupleFactory.getInstance().newTuple(); ret.append(key); ret.append(new DataByteArray(dwb.build().toByteArray())); return ret; }catch(Exception e){ logger.error("Error in processing input row:"+ StackTraceExtractor.getStackTrace(e), e); throw new IOException("Caught exception processing input row:\n" + StackTraceExtractor.getStackTrace(e)); } } }
@Override public boolean transform(DocumentProtos.Media media, String docNewId, MultiTypeParseResult dmBuider, DocumentProtos.MediaContainerOrBuilder mediaToCopy) { DocumentProtos.DocumentWrapperOrBuilder dwo=findWrapperForThisId(docNewId, dmBuider); DocumentProtos.DocumentWrapper.Builder dwb; if (dwo!=null) { dwb=(dwo instanceof DocumentProtos.DocumentWrapper.Builder)? (DocumentProtos.DocumentWrapper.Builder)dwo:((DocumentProtos.DocumentWrapper)dwo).toBuilder(); dmBuider.getDocuments().remove(dwo); } else { dwb=DocumentProtos.DocumentWrapper.newBuilder(); DocumentProtos.MediaContainer.Builder builder=dwb.getMediaContainerBuilder(); for (Media m:mediaToCopy.getMediaList()) { Media.Builder mb=m.toBuilder(); builder.addMedia(mb); } } boolean transform=transform(media, docNewId, dwb.getDocumentMetadataBuilder(),dwb); if (transform) { dpu.setIDFor(dwb, docNewId); dmBuider.add(dwb); } return transform; }
/** * Put metadata as pl.edu.icm.coansys.models.DocumentProtos.Media along with * content as java.util.List<pl.edu.icm.coansys.models.DocumentProtos.Media> * * @param rowId * @param metadata * @param content */ public void put(String rowId, Media metadata, List<Media> content) { final DocumentProtos.DocumentWrapper.Builder dwb = DocumentProtos.DocumentWrapper .newBuilder(); final DocumentProtos.MediaContainer.Builder mcb = DocumentProtos.MediaContainer .newBuilder(); dwb.setRowId(rowId); mcb.addMedia(metadata); addContent(content, mcb); dwb.setMediaContainer(mcb); put(dwb.build()); }
private DocumentWrapper prepareMetadataAndContent(final List<Row> rows) throws IOException { final DocumentWrapper documentWrapper = prepareDocumentWrapper(rows, HBaseConstant.FAMILY_METADATA , HBaseConstant.FAMILY_METADATA_DOCUMENT_QUALIFIER_PROTO); final DocumentWrapper documentWrapperContent = prepareDocumentWrapper(rows, HBaseConstant.FAMILY_CONTENT , HBaseConstant.FAMILY_CONTENT_QUALIFIER_PROTO); if (null != documentWrapper && null != documentWrapperContent) { final DocumentProtos.DocumentWrapper.Builder dwb = DocumentProtos.DocumentWrapper.newBuilder(); final DocumentProtos.MediaContainer.Builder mcb = DocumentProtos.MediaContainer.newBuilder(); dwb.setRowId(documentWrapper.getRowId()); mcb.addAllMedia(documentWrapper.getMediaContainer().getMediaList()); mcb.addAllMedia(documentWrapperContent.getMediaContainer().getMediaList()); dwb.setMediaContainer(mcb); return dwb.build(); } return null; }
@Override public Tuple exec(Tuple tuple) throws IOException { checkCorrectness(tuple); String rowId = (String) tuple.get(0); DataByteArray origDocDBA = (DataByteArray) tuple.get(1); DocumentWrapper.Builder dwb = DocumentWrapper.newBuilder(DocumentWrapper.parseFrom(origDocDBA.get())); dwb = merger.execute(tuple, 3, dwb); DataByteArray resultDocDBA = new DataByteArray(dwb.build().toByteArray()); Tuple result = TupleFactory.getInstance().newTuple(); result.append(rowId); result.append(resultDocDBA); return result; }
private DocumentWrapper documentWrapper(String id, String bwmeta) { final DocumentProtos.Media media = DocumentProtos.Media.newBuilder() .setKey("bwmeta2") .setMediaType("application/xml") .setContent(ByteString.copyFromUtf8(bwmeta)) .build(); final DocumentProtos.MediaContainer.Builder mediaContainer = DocumentProtos.MediaContainer.newBuilder() .addMedia(media); return DocumentProtos.DocumentWrapper.newBuilder() .setRowId(id) .setMediaContainer(mediaContainer) .build(); }
public DocumentWrapper.Builder mainBlockParsing(Tuple t) throws ExecException, InvalidProtocolBufferException{ docId = (String) t.get(2*mainGroupIndex); DataByteArray proto = (DataByteArray) t.get(2*mainGroupIndex+1); return DocumentWrapper.newBuilder(DocumentWrapper.parseFrom(proto.get())); } }
public static DocumentWrapper translate(DocumentDTO docDTO) { DocumentWrapper.Builder dw = DocumentWrapper.newBuilder(); dw.setRowId(RowComposer.composeRow(docDTO)); dw.setDocumentMetadata(docDTO.getDocumentMetadata()); dw.setMediaContainer(docDTO.getMediaConteiner()); return dw.build(); }
private DocumentProtos.DocumentWrapper.Builder prepareDocumentWrapperBuilder(final String newId_url , final DocumentProtos.MediaContainer.Builder mcb) { final DocumentProtos.DocumentWrapper.Builder dwb = DocumentProtos.DocumentWrapper.newBuilder(); dwb.setRowId(newId_url); dwb.setMediaContainer(mcb); return dwb; }
private DocumentWrapper convertMediaToBw2Proto(List<Media> mediaList, String documentKey) { final DocumentProtos.DocumentWrapper.Builder dwb = DocumentProtos.DocumentWrapper .newBuilder(); dwb.setRowId(documentKey); dwb.setMediaContainer(addMedia(mediaList)); return dwb.build(); }
/** * Returns the clone of the passed DocumentWrapper with filled {@link DocumentWrapper#getDocumentMetadata()} and {@link DocumentWrapper#getRowId()} only */ public static DocumentWrapper cloneDocumentMetadata(DocumentWrapper docWrapper) { return DocumentWrapper.newBuilder().setDocumentMetadata(docWrapper.getDocumentMetadata()).setRowId(docWrapper.getRowId()).build(); }