// Fills mediaBuilder with the PDF bytes (content and byte length), the collection, the PDF media type
// and a source path of the form dataPath + "/" + <zip file path> + "#" + pdfInZip, then adds the built
// media to nextItem. Both the media and nextItem receive pdfInZip as key and the same collection.
// NOTE(review): pdfInZip is presumably the entry name inside the archive - confirm against the caller.
mediaBuilder.setKey(pdfInZip); mediaBuilder.setContent(ByteString.copyFrom(pdfByteArray)); mediaBuilder.setCollection(collection); mediaBuilder.setMediaType(ProtoConstants.mediaTypePdf); mediaBuilder.setSourcePath(dataPath + "/" + archive.getZipFilePath() + "#" + pdfInZip); mediaBuilder.setSourceFilesize(pdfByteArray.length); nextItem.addMedia(mediaBuilder.build()); nextItem.setKey(pdfInZip); nextItem.setCollection(collection);
if (m!=null) { DocumentProtos.Media.Builder mediaBuild=DocumentProtos.Media.newBuilder(); mediaBuild.setKey(CrossrefConstants.KEY_CROSSREF_UNIXREF_RECORD); mediaBuild.setMediaType(CrossrefConstants.TYPE_CROSSREF_UNIXREF_RECORD); mediaBuild.setContent(ByteString.copyFrom(m)); build.getMediaContainerBuilder().addMedia(mediaBuild); if (m!=null) { DocumentProtos.Media.Builder mediaBuild=DocumentProtos.Media.newBuilder(); mediaBuild.setKey(CrossrefConstants.KEY_CROSSREF_JSON_RECORD); mediaBuild.setMediaType(CrossrefConstants.TYPE_CROSSREF_JSON_RECORD); mediaBuild.setContent(ByteString.copyFrom(m)); build.getMediaContainerBuilder().addMedia(mediaBuild);
nlmMediaBuilder.setCollection(media.getCollection()); nlmMediaBuilder.setKey(media.getKey()); nlmMediaBuilder.setSourceFilesize(nlmString.length()); nlmMediaBuilder.setContent(ByteString.copyFromUtf8(nlmString)); nlmMediaBuilder.setMediaType(ProtoConstants.mediaTypeNlm); signleProvenance.setLastModificationMarkerId("Coansys NLM extraction (CERMINE)"); provenanceBuilder.setCurrentProvenance(signleProvenance); nlmMediaBuilder.setProvenance(provenanceBuilder); context.write(new Text(media.getKey()), new BytesWritable(nlmMediaBuilder.build().toByteArray())); } catch (AnalysisException ex) { logger.warn("cannot process PDF " + media.getSourcePath(), ex);
// Reads the whole mediaIS stream into memory and stores it as the media content, keyed by the
// document key and tagged with mediaType. The source path is <zip file path> + "#" + foundPath and the
// recorded file size is the number of bytes read. The built media and its type are then registered
// on docDTO.
// NOTE(review): mediaIS.close() is the last statement, so within the visible statements the stream
// stays open if any earlier call throws - confirm whether an enclosing try/finally handles that.
mediaBuilder.setKey(docDTO.getKey()); mediaBuilder.setMediaType(mediaType); byte[] content = IOUtils.toByteArray(mediaIS); mediaBuilder.setContent(ByteString.copyFrom(content)); mediaBuilder.setSourcePath(currentZipArchive.getZipFilePath() + "#" + foundPath); mediaBuilder.setSourceFilesize(content.length); docDTO.addMedia(mediaBuilder.build()); docDTO.addMediaType(mediaType); mediaIS.close();
/**
 * Normalizes the ids of the given bwmeta elements in place and appends the
 * serialized bwmeta as a media entry to the wrapper's media container.
 *
 * <p>Only {@code YElement} entries whose current id matches {@code NON_ID_CHARS}
 * are modified. For an element whose journal hierarchy structure is present and
 * whose current level equals (ignoring case) the journal-article level, the new
 * id is derived from {@code docNewId}; for every other element it is derived
 * from the element's own id. In both cases each character outside
 * {@code [a-zA-Z0-9\-_]} is replaced with an underscore.
 *
 * @param bwmeta   exportables to normalize and serialize; elements are mutated
 * @param docNewId id used as the basis for journal-article elements that need a new id
 * @param builder  wrapper builder whose media container receives the bwmeta record
 * @throws UnsupportedEncodingException retained from the original signature so
 *         existing callers keep compiling; the UTF-8 encoding step itself no
 *         longer raises it
 */
protected void addBwmetaMedia(List<YExportable> bwmeta, String docNewId,
        DocumentProtos.DocumentWrapper.Builder builder) throws UnsupportedEncodingException {
    for (YExportable ex : bwmeta) {
        if (!(ex instanceof YElement)) {
            continue;
        }
        final YElement element = (YElement) ex;

        // Evaluated before the id check to keep the original call order.
        final boolean journalArticle =
                element.getStructure(HierarchyWithLevelIds.EXT_HIERARCHY_JOURNAL) != null
                && HierarchyWithLevelIds.EXT_LEVEL_JOURNAL_ARTICLE.equalsIgnoreCase(
                        element.getStructure(HierarchyWithLevelIds.EXT_HIERARCHY_JOURNAL)
                                .getCurrent().getLevel());

        if (NON_ID_CHARS.matcher(element.getId()).find()) {
            // Journal articles take the document id; everything else keeps its own id as the basis.
            final String baseId = journalArticle ? docNewId : element.getId();
            element.setId(baseId.replaceAll("[^a-zA-Z0-9\\-_]", "_"));
        }
    }

    final String bwmetas = ywriter.write(bwmeta);
    builder.getMediaContainerBuilder().addMediaBuilder()
            .setKey(BWMeta2Constants.KEY_BWMETA2_RECORD)
            .setMediaType(BWMeta2Constants.TYPE_BWMETA2_RECORD)
            // copyFromUtf8 encodes as UTF-8 without a charset-name lookup.
            .setContent(ByteString.copyFromUtf8(bwmetas));
}
/**
 * Creates a media builder holding the given bytes.
 *
 * @param valueBytes  bytes copied into the media content
 * @param recordKey   value stored as the media key
 * @param recordValue value stored as the media type
 * @return a new, not yet built, media builder
 */
private DocumentProtos.Media.Builder prepareMedia(final byte[] valueBytes, final String recordKey,
        final String recordValue) {
    return DocumentProtos.Media.newBuilder()
            .setKey(recordKey)
            .setMediaType(recordValue)
            .setContent(ByteString.copyFrom(valueBytes));
}
}
/**
 * Builds a media message from a publication attachment.
 *
 * <p>The key comes from {@code getKey()}, the media type from
 * {@code getMimeType()}, and the content from the bytes that
 * {@code readBytes} returns for {@code getData()}.
 *
 * @param attachment attachment to convert
 * @return the built media message
 */
private Media convertAttachmentsToMedia(PublicationAttachment attachment) {
    return DocumentProtos.Media.newBuilder()
            .setKey(attachment.getKey())
            .setMediaType(attachment.getMimeType())
            .setContent(ByteString.copyFrom(readBytes(attachment.getData())))
            .build();
}
/**
 * Builds a media message from a publication's metadata.
 *
 * <p>The key comes from {@code getPublicationMetadataKey()}, the media type
 * from {@code getPublicationMetadataFormat()}, and the content from the bytes
 * that {@code readBytes} returns for {@code getPublicationMetadata()}.
 *
 * @param publication publication whose metadata is converted
 * @return the built media message
 */
private Media convertBwmetaToMedia(PublicationData publication) {
    return DocumentProtos.Media.newBuilder()
            .setKey(publication.getPublicationMetadataKey())
            .setMediaType(publication.getPublicationMetadataFormat())
            .setContent(ByteString.copyFrom(readBytes(publication.getPublicationMetadata())))
            .build();
}
/**
 * Creates a document wrapper with the given row id and a media container
 * holding one media entry: key {@code "bwmeta2"}, media type
 * {@code "application/xml"}, content the UTF-8 bytes of {@code bwmeta}.
 *
 * @param id     row id of the wrapper
 * @param bwmeta text stored as the media content
 * @return the built document wrapper
 */
private DocumentWrapper documentWrapper(String id, String bwmeta) {
    final DocumentProtos.Media.Builder bwmetaMedia = DocumentProtos.Media.newBuilder();
    bwmetaMedia.setKey("bwmeta2");
    bwmetaMedia.setMediaType("application/xml");
    bwmetaMedia.setContent(ByteString.copyFromUtf8(bwmeta));

    final DocumentProtos.MediaContainer.Builder container = DocumentProtos.MediaContainer.newBuilder();
    container.addMedia(bwmetaMedia.build());

    final DocumentProtos.DocumentWrapper.Builder wrapper = DocumentProtos.DocumentWrapper.newBuilder();
    wrapper.setRowId(id);
    wrapper.setMediaContainer(container);
    return wrapper.build();
}