@Override public void process(final InputStream stream) throws IOException { try (final InputStream in = new BufferedInputStream(stream)) { TikaInputStream tikaStream = TikaInputStream.get(in); Metadata metadata = new Metadata(); if (filename != null && context.getProperty(USE_FILENAME_IN_DETECTION).asBoolean()) { metadata.add(TikaMetadataKeys.RESOURCE_NAME_KEY, filename); } // Get mime type MediaType mediatype = detector.detect(tikaStream, metadata); mimeTypeRef.set(mediatype.toString()); } } });
/**
 * Adds {@code value} to this instance's metadata under {@code property}.
 * A {@code null} value is ignored.
 *
 * @param property the metadata property to add to
 * @param value    the value to add; nothing happens when it is {@code null}
 */
private void add(Property property, String value) {
    if (value == null) {
        return;
    }
    metadata.add(property, value);
}
/**
 * Adds a value for {@code property} to {@code metadata}, substituting the empty
 * string when {@code value} is {@code null}.
 *
 * @param property the metadata property to add to
 * @param value    the value to add, possibly {@code null}
 * @param metadata the metadata object receiving the value
 */
public static void addEvenIfNull(Property property, String value, Metadata metadata) {
    final String effectiveValue = (value == null) ? "" : value;
    metadata.add(property, effectiveValue);
}
private void addMetadataByString( Metadata metadata, String name, String value ) { // Add metadata if an appropriate value is passed if (value != null) { metadata.add( name, value ); } }
// Record the page's content type under the CONTENT_TYPE metadata key.
metadata.add(Metadata.CONTENT_TYPE, page.getContentType());
/**
 * Adds the string form of the first chunk to {@code metadata} under {@code property}.
 * Nothing is added when the list is {@code null}, empty, or its first element is
 * {@code null}.
 *
 * @param chunks   the candidate chunks; only index 0 is considered
 * @param property the metadata property to add to
 * @param metadata the metadata object receiving the value
 */
private static void addFirstChunk(List<Chunk> chunks, Property property, Metadata metadata) {
    if (chunks != null && !chunks.isEmpty()) {
        final Chunk first = chunks.get(0);
        if (first != null) {
            metadata.add(property, first.toString());
        }
    }
}
/**
 * Looks up the {@code xml}/{@code lang} attribute of the given node via
 * {@code getFirstAttribute} and, when one is found, adds it to {@code metadata}
 * under the key {@code "Language"}.
 *
 * @param text     the node to inspect
 * @param metadata the metadata object receiving the language value
 */
private void parseText(Node text, Metadata metadata) {
    final String language = getFirstAttribute(text, "xml", "lang");
    if (language == null) {
        return;
    }
    metadata.add("Language", language);
}
/**
 * Stores the handler's string form in {@code metadata} under
 * {@code RecursiveParserWrapperHandler.TIKA_CONTENT} and passes the metadata to
 * {@code jsonWriter}.
 *
 * @param contentHandler the handler whose {@code toString()} value is recorded
 * @param metadata       the metadata of the embedded document
 * @throws SAXException wrapping any {@link IOException} raised by the writer
 */
@Override
public void endEmbeddedDocument(ContentHandler contentHandler, Metadata metadata)
        throws SAXException {
    final String content = contentHandler.toString();
    metadata.add(RecursiveParserWrapperHandler.TIKA_CONTENT, content);
    try {
        jsonWriter.add(metadata);
    } catch (IOException ioe) {
        // Surface writer failures through the SAX callback contract, keeping the cause
        throw new SAXException(ioe);
    }
}
/**
 * Stores information about a {@link Parser} failure in the {@link Metadata}:
 * the stack trace of the failure under {@code EMBEDDED_EXCEPTION} and the
 * parser's class name under {@code EMBEDDED_PARSER}. This lets callers inspect
 * what went wrong even when the {@link Exception} was not thrown straight away
 * (eg when several different Parsers are used).
 *
 * @param parser   the parser that failed
 * @param failure  the problem that was raised
 * @param metadata the metadata object receiving the failure details
 */
public static void recordParserFailure(Parser parser, Throwable failure, Metadata metadata) {
    metadata.add(EMBEDDED_EXCEPTION, ExceptionUtils.getStackTrace(failure));

    final String parserClassname = getParserClassname(parser);
    metadata.add(EMBEDDED_PARSER, parserClassname);
}
/**
 * On element end, looks up the property for the element and, when one exists,
 * stores the buffered text in the metadata: appended with {@code add} when the
 * property permits multiple values, otherwise written with {@code set}.
 * The buffer is cleared in every case.
 *
 * @throws SAXException declared by the callback contract
 */
@Override
public void endElement(String uri, String localName, String qName) throws SAXException {
    final Property prop = getProperty(uri, localName);
    if (prop != null) {
        final String text = buffer.toString();
        if (!prop.isMultiValuePermitted()) {
            metadata.set(prop, text);
        } else {
            metadata.add(prop, text);
        }
    }
    // Reset for the next element regardless of whether a property matched
    buffer.setLength(0);
}
/**
 * Adds the directory's {@code JpegCommentDirectory.TAG_COMMENT} value to
 * {@code metadata} under {@code TikaCoreProperties.COMMENTS}, when the
 * directory contains that tag.
 *
 * @param directory the directory to read the comment from
 * @param metadata  the metadata object receiving the comment
 * @throws MetadataException declared by the handler contract
 */
public void handle(Directory directory, Metadata metadata) throws MetadataException {
    if (!directory.containsTag(JpegCommentDirectory.TAG_COMMENT)) {
        return;
    }
    final String comment = directory.getString(JpegCommentDirectory.TAG_COMMENT);
    metadata.add(TikaCoreProperties.COMMENTS, comment);
}
}
private void addMetadata(Metadata metadata, Property property, String value) { if (value != null) { String decoded = decode(value); if (property.isMultiValuePermitted() || metadata.get(property) == null) { metadata.add(property, decoded); } //silently skip adding property that already exists if multiple values are not permitted } }
// Detect the media type using the detector from Tika's default configuration.
// The file name is handed to the detector through the RESOURCE_NAME_KEY metadata entry.
// NOTE(review): the TikaInputStream is not closed in the lines visible here - confirm the surrounding code closes it.
TikaConfig config = TikaConfig.getDefaultConfig(); Detector detector = config.getDetector(); TikaInputStream stream = TikaInputStream.get(fileOrStream); Metadata metadata = new Metadata(); metadata.add(Metadata.RESOURCE_NAME_KEY, filenameWithExtension); MediaType mediaType = detector.detect(stream, metadata);
/**
 * Adds every value of {@code record} except the first (index 0) to
 * {@code metadata} under the key {@code field}. A {@code null} record or a
 * record with at most one value adds nothing.
 *
 * @param field    the metadata key
 * @param record   the CSV record supplying the values
 * @param metadata the metadata object receiving the values
 */
private static void addMetadata(String field, CSVRecord record, Metadata metadata) {
    if (record != null && record.size() > 1) {
        // Index 0 is skipped; values start at index 1
        for (int column = 1; column < record.size(); column++) {
            metadata.add(field, record.get(column));
        }
    }
}
/**
 * Adds the role and organisation name of every contact in {@code defaultMetaData}
 * to {@code metadata}. The role name goes under {@code "ContactRole"} and the
 * organisation name under {@code "ContactPartyName-"}; a contact attribute that is
 * {@code null} is skipped.
 *
 * @param metadata        the metadata object receiving the values
 * @param defaultMetaData the source metadata whose contacts are read
 */
private void getMetaDataContact(Metadata metadata, DefaultMetadata defaultMetaData) {
    // Iterate over the collection as returned. Only iteration is needed, so no
    // downcast to a concrete list implementation (which could fail at runtime).
    for (ResponsibleParty rparty : defaultMetaData.getContacts()) {
        if (rparty.getRole() != null) {
            metadata.add("ContactRole", rparty.getRole().name());
        }
        if (rparty.getOrganisationName() != null) {
            // NOTE(review): the key ends with '-'; left unchanged because consumers
            // may already depend on it - confirm whether that is intended.
            metadata.add("ContactPartyName-", rparty.getOrganisationName().toString());
        }
    }
}
/**
 * Adds the title of the parent metadata citation to {@code metadata} under
 * {@code "ParentMetaDataTitle"}. Nothing is added when there is no parent
 * metadata or it has no title.
 *
 * @param metadata        the metadata object receiving the title
 * @param defaultMetaData the source metadata whose parent citation is read
 */
private void getMetaDataParentMetaDataTitle(Metadata metadata, DefaultMetadata defaultMetaData) {
    final Citation parent = defaultMetaData.getParentMetadata();
    if (parent == null || parent.getTitle() == null) {
        return;
    }
    metadata.add("ParentMetaDataTitle", parent.getTitle().toString());
}
/**
 * Adds one entry to {@code metadata} for every citation date in
 * {@code defaultMetaData} that has a date type. Each value is the date type name
 * followed by a space and the date as formatted by {@code DateUtils.formatDate};
 * dates without a type are skipped.
 *
 * @param metadata        the metadata object receiving the values
 * @param defaultMetaData the source metadata whose date info is read
 */
private void getMetaDataDateInfo(Metadata metadata, DefaultMetadata defaultMetaData) {
    // Iterate over the collection as returned. Only iteration is needed, so no
    // downcast to ArrayList (which could fail at runtime for other collection types).
    for (CitationDate c : defaultMetaData.getDateInfo()) {
        if (c.getDateType() != null) {
            String date = DateUtils.formatDate(c.getDate());
            // NOTE(review): the key has a trailing space; left unchanged because
            // consumers may already depend on it - confirm whether that is intended.
            metadata.add("DateInfo ", c.getDateType().name() + " " + date);
        }
    }
}
/**
 * A metadata object holding a single key/value pair renders as {@code key=value}.
 */
@Test
public void testToStringWithSingleEntry() {
    final Metadata metadata = new Metadata();
    metadata.add("key", "value1");

    final String rendered = metadata.toString();

    assertEquals("key=value1", rendered);
}
}
/**
 * TIKA-2460 Test loading of custom-mimetypes.xml from sys prop.
 * <p>
 * The system property is JVM-wide, so its previous state is restored once the
 * test finishes to keep it from leaking into other tests.
 */
@Test
public void testExternalMimeTypes() throws Exception {
    final String previous = System.getProperty(MimeTypesFactory.CUSTOM_MIMES_SYS_PROP);
    System.setProperty(MimeTypesFactory.CUSTOM_MIMES_SYS_PROP,
            "src/test/resources/org/apache/tika/mime/external-mimetypes.xml");
    try {
        MimeTypes mimeTypes = MimeTypes.getDefaultMimeTypes(new CustomClassLoader());
        Metadata m = new Metadata();
        m.add(TikaCoreProperties.RESOURCE_NAME_KEY, "test.external.mime.type");
        assertEquals("external/mime-type", mimeTypes.detect(null, m).toString());
    } finally {
        // Put the property back exactly as it was before the test ran
        if (previous == null) {
            System.clearProperty(MimeTypesFactory.CUSTOM_MIMES_SYS_PROP);
        } else {
            System.setProperty(MimeTypesFactory.CUSTOM_MIMES_SYS_PROP, previous);
        }
    }
}