/**
 * Runs every form of the given list through {@code filter(FormDocument)}
 * and collects the results in iteration order.
 *
 * @param forms
 *            the forms to filter
 * @return a new list holding one filtered form per input form
 */
private List<FormDocument> filterForms(List<FormDocument> forms) {
    final int formCount = forms.size();
    final List<FormDocument> result = new ArrayList<>(formCount);
    for (FormDocument current : forms) {
        FormDocument filteredForm = filter(current);
        result.add(filteredForm);
    }
    return result;
}
/**
 * Builds an item document from filtered parts of the given one, using
 * {@code dataObjectFactory.getItemDocument}.
 * <p>
 * The entity id and revision id are passed on unchanged. Labels,
 * descriptions and the flattened aliases go through
 * {@code filterMonoLingualTextValues}, statement groups through
 * {@code filterStatementGroups}, and site links through
 * {@code filterSiteLinks}.
 *
 * @param item
 *            the item document to filter
 * @return the item document created by the data object factory
 */
public ItemDocument filter(ItemDocument item) { return dataObjectFactory.getItemDocument( item.getEntityId(), filterMonoLingualTextValues(item.getLabels().values()), filterMonoLingualTextValues(item.getDescriptions().values()), filterMonoLingualTextValues(flatten(item.getAliases().values())), filterStatementGroups(item.getStatementGroups()), filterSiteLinks(item.getSiteLinks()), item.getRevisionId() ); }
/**
 * Builds a property document from filtered parts of the given one, using
 * {@code dataObjectFactory.getPropertyDocument}.
 * <p>
 * The entity id, datatype and revision id are passed on unchanged. Labels,
 * descriptions and the flattened aliases go through
 * {@code filterMonoLingualTextValues}, and statement groups through
 * {@code filterStatementGroups}.
 *
 * @param property
 *            the property document to filter
 * @return the property document created by the data object factory
 */
public PropertyDocument filter(PropertyDocument property) { return dataObjectFactory.getPropertyDocument( property.getEntityId(), filterMonoLingualTextValues(property.getLabels().values()), filterMonoLingualTextValues(property.getDescriptions().values()), filterMonoLingualTextValues(flatten(property.getAliases().values())), filterStatementGroups(property.getStatementGroups()), property.getDatatype(), property.getRevisionId() ); }
/** * Constructor. * * @param entityDocumentProcessor * the processor to use on the filtered data * @param filter * the filter settings to be used */ public EntityDocumentProcessorFilter( EntityDocumentProcessor entityDocumentProcessor, DocumentDataFilter filter) { this.entityDocumentProcessor = entityDocumentProcessor; this.datamodelFilter = new DatamodelFilter(new DataObjectFactoryImpl(), filter); }
/**
 * Builds a lexeme document from filtered parts of the given one, using
 * {@code dataObjectFactory.getLexemeDocument}.
 * <p>
 * The entity id, lexical category, language and revision id are passed on
 * unchanged. Lemmas go through {@code filterMonoLingualTextValues},
 * statement groups through {@code filterStatementGroups}, forms through
 * {@code filterForms}, and senses through {@code filterSenses}.
 *
 * @param lexeme
 *            the lexeme document to filter
 * @return the lexeme document created by the data object factory
 */
public LexemeDocument filter(LexemeDocument lexeme) { return dataObjectFactory.getLexemeDocument( lexeme.getEntityId(), lexeme.getLexicalCategory(), lexeme.getLanguage(), filterMonoLingualTextValues(lexeme.getLemmas().values()), filterStatementGroups(lexeme.getStatementGroups()), filterForms(lexeme.getForms()), filterSenses(lexeme.getSenses()), lexeme.getRevisionId() ); }
/**
 * Builds a sense document from filtered parts of the given one, using
 * {@code dataObjectFactory.getSenseDocument}.
 * <p>
 * The entity id and revision id are passed on unchanged. Glosses go
 * through {@code filterMonoLingualTextValues}, and statement groups
 * through {@code filterStatementGroups}.
 *
 * @param sense
 *            the sense document to filter
 * @return the sense document created by the data object factory
 */
public SenseDocument filter(SenseDocument sense) { return dataObjectFactory.getSenseDocument( sense.getEntityId(), filterMonoLingualTextValues(sense.getGlosses().values()), filterStatementGroups(sense.getStatementGroups()), sense.getRevisionId() ); }
/** * Constructor. * * @param entityDocumentProcessor * the processor to use on the filtered data * @param filter * the filter settings to be used */ public EntityDocumentProcessorFilter( EntityDocumentProcessor entityDocumentProcessor, DocumentDataFilter filter) { this.entityDocumentProcessor = entityDocumentProcessor; this.datamodelFilter = new DatamodelFilter(new DataObjectFactoryImpl(), filter); }
/**
 * Builds a lexeme document from filtered parts of the given one, using
 * {@code dataObjectFactory.getLexemeDocument}.
 * <p>
 * The entity id, lexical category, language and revision id are passed on
 * unchanged. Lemmas go through {@code filterMonoLingualTextValues},
 * statement groups through {@code filterStatementGroups}, forms through
 * {@code filterForms}, and senses through {@code filterSenses}.
 *
 * @param lexeme
 *            the lexeme document to filter
 * @return the lexeme document created by the data object factory
 */
public LexemeDocument filter(LexemeDocument lexeme) { return dataObjectFactory.getLexemeDocument( lexeme.getEntityId(), lexeme.getLexicalCategory(), lexeme.getLanguage(), filterMonoLingualTextValues(lexeme.getLemmas().values()), filterStatementGroups(lexeme.getStatementGroups()), filterForms(lexeme.getForms()), filterSenses(lexeme.getSenses()), lexeme.getRevisionId() ); }
/**
 * Builds a property document from filtered parts of the given one, using
 * {@code dataObjectFactory.getPropertyDocument}.
 * <p>
 * The entity id, datatype and revision id are passed on unchanged. Labels,
 * descriptions and the flattened aliases go through
 * {@code filterMonoLingualTextValues}, and statement groups through
 * {@code filterStatementGroups}.
 *
 * @param property
 *            the property document to filter
 * @return the property document created by the data object factory
 */
public PropertyDocument filter(PropertyDocument property) { return dataObjectFactory.getPropertyDocument( property.getEntityId(), filterMonoLingualTextValues(property.getLabels().values()), filterMonoLingualTextValues(property.getDescriptions().values()), filterMonoLingualTextValues(flatten(property.getAliases().values())), filterStatementGroups(property.getStatementGroups()), property.getDatatype(), property.getRevisionId() ); }
/**
 * Builds a sense document from filtered parts of the given one, using
 * {@code dataObjectFactory.getSenseDocument}.
 * <p>
 * The entity id and revision id are passed on unchanged. Glosses go
 * through {@code filterMonoLingualTextValues}, and statement groups
 * through {@code filterStatementGroups}.
 *
 * @param sense
 *            the sense document to filter
 * @return the sense document created by the data object factory
 */
public SenseDocument filter(SenseDocument sense) { return dataObjectFactory.getSenseDocument( sense.getEntityId(), filterMonoLingualTextValues(sense.getGlosses().values()), filterStatementGroups(sense.getStatementGroups()), sense.getRevisionId() ); }
/**
 * Runs every form of the given list through {@code filter(FormDocument)}
 * and collects the results in iteration order.
 *
 * @param forms
 *            the forms to filter
 * @return a new list holding one filtered form per input form
 */
private List<FormDocument> filterForms(List<FormDocument> forms) {
    final int formCount = forms.size();
    final List<FormDocument> result = new ArrayList<>(formCount);
    for (FormDocument current : forms) {
        FormDocument filteredForm = filter(current);
        result.add(filteredForm);
    }
    return result;
}
this.datamodelFilter = new DatamodelFilter(new DataObjectFactoryImpl(), documentDataFilter);
/**
 * Builds an item document from filtered parts of the given one, using
 * {@code dataObjectFactory.getItemDocument}.
 * <p>
 * The entity id and revision id are passed on unchanged. Labels,
 * descriptions and the flattened aliases go through
 * {@code filterMonoLingualTextValues}, statement groups through
 * {@code filterStatementGroups}, and site links through
 * {@code filterSiteLinks}.
 *
 * @param item
 *            the item document to filter
 * @return the item document created by the data object factory
 */
public ItemDocument filter(ItemDocument item) { return dataObjectFactory.getItemDocument( item.getEntityId(), filterMonoLingualTextValues(item.getLabels().values()), filterMonoLingualTextValues(item.getDescriptions().values()), filterMonoLingualTextValues(flatten(item.getAliases().values())), filterStatementGroups(item.getStatementGroups()), filterSiteLinks(item.getSiteLinks()), item.getRevisionId() ); }
/**
 * Builds a form document from filtered parts of the given one, using
 * {@code dataObjectFactory.getFormDocument}.
 * <p>
 * The entity id, grammatical features and revision id are passed on
 * unchanged. Representations go through
 * {@code filterMonoLingualTextValues}, and statement groups through
 * {@code filterStatementGroups}.
 *
 * @param form
 *            the form document to filter
 * @return the form document created by the data object factory
 */
public FormDocument filter(FormDocument form) { return dataObjectFactory.getFormDocument( form.getEntityId(), filterMonoLingualTextValues(form.getRepresentations().values()), form.getGrammaticalFeatures(), filterStatementGroups(form.getStatementGroups()), form.getRevisionId() ); }
/**
 * Runs every sense of the given list through {@code filter(SenseDocument)}
 * and collects the results in iteration order.
 *
 * @param senses
 *            the senses to filter
 * @return a new list holding one filtered sense per input sense
 */
private List<SenseDocument> filterSenses(List<SenseDocument> senses) {
    final int senseCount = senses.size();
    final List<SenseDocument> result = new ArrayList<>(senseCount);
    for (SenseDocument current : senses) {
        SenseDocument filteredSense = filter(current);
        result.add(filteredSense);
    }
    return result;
}
/** * Constructor. Initializes various helper objects we use for the JSON * serialization, and opens the file that we want to write to. * * @throws IOException * if there is a problem opening the output file */ public JsonSerializationProcessor() throws IOException { // The filter is used to copy selected parts of the data. We use this // to remove some parts from the documents we serialize. DocumentDataFilter filter = new DocumentDataFilter(); // Only copy English labels, descriptions, and aliases: filter.setLanguageFilter(Collections.singleton("en")); // Only copy statements of some properties: Set<PropertyIdValue> propertyFilter = new HashSet<>(); propertyFilter.add(Datamodel.makeWikidataPropertyIdValue("P18")); // image propertyFilter.add(Datamodel.makeWikidataPropertyIdValue("P106")); // occupation propertyFilter.add(Datamodel.makeWikidataPropertyIdValue("P569")); // birthdate filter.setPropertyFilter(propertyFilter); // Do not copy any sitelinks: filter.setSiteLinkFilter(Collections.<String>emptySet()); this.datamodelFilter = new DatamodelFilter(new DataObjectFactoryImpl(), new DocumentDataFilter()); // The (compressed) file we write to. OutputStream outputStream = new GzipCompressorOutputStream( new BufferedOutputStream( ExampleHelpers .openExampleFileOuputStream(OUTPUT_FILE_NAME))); this.jsonSerializer = new JsonSerializer(outputStream); this.jsonSerializer.open(); }
/**
 * Builds a form document from filtered parts of the given one, using
 * {@code dataObjectFactory.getFormDocument}.
 * <p>
 * The entity id, grammatical features and revision id are passed on
 * unchanged. Representations go through
 * {@code filterMonoLingualTextValues}, and statement groups through
 * {@code filterStatementGroups}.
 *
 * @param form
 *            the form document to filter
 * @return the form document created by the data object factory
 */
public FormDocument filter(FormDocument form) { return dataObjectFactory.getFormDocument( form.getEntityId(), filterMonoLingualTextValues(form.getRepresentations().values()), form.getGrammaticalFeatures(), filterStatementGroups(form.getStatementGroups()), form.getRevisionId() ); }
/**
 * Runs every sense of the given list through {@code filter(SenseDocument)}
 * and collects the results in iteration order.
 *
 * @param senses
 *            the senses to filter
 * @return a new list holding one filtered sense per input sense
 */
private List<SenseDocument> filterSenses(List<SenseDocument> senses) {
    final int senseCount = senses.size();
    final List<SenseDocument> result = new ArrayList<>(senseCount);
    for (SenseDocument current : senses) {
        SenseDocument filteredSense = filter(current);
        result.add(filteredSense);
    }
    return result;
}
/**
 * Filters the given item document with {@code datamodelFilter} and passes
 * the result to the wrapped {@code entityDocumentProcessor}.
 *
 * @param itemDocument
 *            the item document to filter and forward
 */
@Override
public void processItemDocument(ItemDocument itemDocument) {
    ItemDocument filteredDocument = datamodelFilter.filter(itemDocument);
    entityDocumentProcessor.processItemDocument(filteredDocument);
}
/**
 * Filters the given lexeme document with {@code datamodelFilter} and
 * passes the result to the wrapped {@code entityDocumentProcessor}.
 *
 * @param lexemeDocument
 *            the lexeme document to filter and forward
 */
@Override
public void processLexemeDocument(LexemeDocument lexemeDocument) {
    LexemeDocument filteredDocument = datamodelFilter.filter(lexemeDocument);
    entityDocumentProcessor.processLexemeDocument(filteredDocument);
}