New implementation for Conflicts-With Scrutinizer (#2693)
part of #2354
This commit is contained in:
parent
f88c0e3657
commit
45fab05bf6
@ -27,10 +27,10 @@ import org.wikidata.wdtk.datamodel.interfaces.ItemIdValue;
|
||||
import org.wikidata.wdtk.datamodel.interfaces.PropertyIdValue;
|
||||
import org.wikidata.wdtk.datamodel.interfaces.QuantityValue;
|
||||
import org.wikidata.wdtk.datamodel.interfaces.Value;
|
||||
import org.wikidata.wdtk.datamodel.interfaces.Statement;
|
||||
|
||||
import java.util.List;
|
||||
import java.util.Map;
|
||||
import java.util.Set;
|
||||
import java.util.stream.Stream;
|
||||
|
||||
/**
|
||||
* An object that fetches constraints about properties.
|
||||
@ -53,7 +53,7 @@ public interface ConstraintFetcher {
|
||||
/**
|
||||
* Retrieves the property that is the inverse of a given property
|
||||
*
|
||||
* @param pid:
|
||||
* @param pid
|
||||
* the property to retrieve the inverse for
|
||||
* @return the pid of the inverse property
|
||||
*/
|
||||
@ -143,6 +143,17 @@ public interface ConstraintFetcher {
|
||||
*/
|
||||
boolean usableOnItems(PropertyIdValue pid);
|
||||
|
||||
/**
|
||||
* Gets the list of constraints of a particular type for a property
|
||||
*
|
||||
* @param pid
|
||||
* the property to retrieve the constraints for
|
||||
* @param qid
|
||||
* the type of the constraints
|
||||
* @return the stream of matching constraint statements
|
||||
*/
|
||||
Stream<Statement> getConstraintsByType(PropertyIdValue pid, String qid);
|
||||
|
||||
/**
|
||||
* Retrieves the lower bound of the range
|
||||
* required in difference-within-range constraint
|
||||
@ -165,7 +176,7 @@ public interface ConstraintFetcher {
|
||||
* Retrieves the lower value property for calculating the difference
|
||||
* required in difference-within-range constraint
|
||||
*
|
||||
* @param pid:
|
||||
* @param pid
|
||||
* the property to calculate difference with
|
||||
* @return the pid of the lower bound property
|
||||
*/
|
||||
@ -177,13 +188,4 @@ public interface ConstraintFetcher {
|
||||
*/
|
||||
boolean hasDiffWithinRange(PropertyIdValue pid);
|
||||
|
||||
/*
|
||||
* Returns the Map of all the conflicting pid and their item values
|
||||
*
|
||||
* @param pid:
|
||||
* the property having conflicts-with constraint
|
||||
* @return
|
||||
*/
|
||||
Map<PropertyIdValue, List<Value>> getParamConflictsWith(PropertyIdValue pid);
|
||||
|
||||
}
|
||||
|
@ -30,9 +30,7 @@ import org.wikidata.wdtk.datamodel.interfaces.*;
|
||||
|
||||
import java.util.ArrayList;
|
||||
import java.util.List;
|
||||
import java.util.Map;
|
||||
import java.util.Set;
|
||||
import java.util.HashMap;
|
||||
import java.util.stream.Collectors;
|
||||
import java.util.stream.Stream;
|
||||
|
||||
@ -97,10 +95,6 @@ public class WikidataConstraintFetcher implements ConstraintFetcher {
|
||||
public static String ALLOWED_ITEM_TYPE_QID = "Q29934200";
|
||||
public static String ALLOWED_ENTITY_TYPES_PID = "P2305";
|
||||
|
||||
public static String CONFLICTS_WITH_CONSTRAINT_QID = "Q21502838";
|
||||
public static String CONFLICTS_WITH_PROPERTY_PID = "P2306";
|
||||
public static String ITEM_OF_PROPERTY_CONSTRAINT_PID = "P2305";
|
||||
|
||||
// The following constraints still need to be implemented:
|
||||
|
||||
public static String TYPE_CONSTRAINT_QID = "Q21503250";
|
||||
@ -279,9 +273,9 @@ public class WikidataConstraintFetcher implements ConstraintFetcher {
|
||||
* Returns a single constraint for a particular type and a property, or null if
|
||||
* there is no such constraint
|
||||
*
|
||||
* @param pid:
|
||||
* @param pid
|
||||
* the property to retrieve the constraints for
|
||||
* @param qid:
|
||||
* @param qid
|
||||
* the type of the constraints
|
||||
* @return the list of qualifiers for the constraint, or null if it does not
|
||||
* exist
|
||||
@ -297,13 +291,14 @@ public class WikidataConstraintFetcher implements ConstraintFetcher {
|
||||
/**
|
||||
* Gets the list of constraints of a particular type for a property
|
||||
*
|
||||
* @param pid:
|
||||
* @param pid
|
||||
* the property to retrieve the constraints for
|
||||
* @param qid:
|
||||
* @param qid
|
||||
* the type of the constraints
|
||||
* @return the stream of matching constraint statements
|
||||
*/
|
||||
protected Stream<Statement> getConstraintsByType(PropertyIdValue pid, String qid) {
|
||||
@Override
|
||||
public Stream<Statement> getConstraintsByType(PropertyIdValue pid, String qid) {
|
||||
Stream<Statement> allConstraints = getConstraintStatements(pid).stream()
|
||||
.filter(s -> s.getValue() != null && ((EntityIdValue) s.getValue()).getId().equals(qid))
|
||||
.filter(s -> !StatementRank.DEPRECATED.equals(s.getRank()));
|
||||
@ -314,7 +309,7 @@ public class WikidataConstraintFetcher implements ConstraintFetcher {
|
||||
* Gets all the constraint statements for a given property
|
||||
*
|
||||
* @param pid
|
||||
* : the id of the property to retrieve the constraints for
|
||||
* the id of the property to retrieve the constraints for
|
||||
* @return the list of constraint statements
|
||||
*/
|
||||
protected List<Statement> getConstraintStatements(PropertyIdValue pid) {
|
||||
@ -332,9 +327,9 @@ public class WikidataConstraintFetcher implements ConstraintFetcher {
|
||||
/**
|
||||
* Returns the values of a given property in qualifiers
|
||||
*
|
||||
* @param groups:
|
||||
* @param groups
|
||||
* the qualifiers
|
||||
* @param pid:
|
||||
* @param pid
|
||||
* the property to filter on
|
||||
* @return
|
||||
*/
|
||||
@ -373,7 +368,7 @@ public class WikidataConstraintFetcher implements ConstraintFetcher {
|
||||
* Retrieves the lower value property for calculating the difference
|
||||
* required in difference-within-range constraint
|
||||
*
|
||||
* @param pid:
|
||||
* @param pid
|
||||
* the property to calculate difference with
|
||||
* @return the pid of the lower bound property
|
||||
*/
|
||||
@ -428,36 +423,4 @@ public class WikidataConstraintFetcher implements ConstraintFetcher {
|
||||
return null;
|
||||
}
|
||||
|
||||
/**
|
||||
* Returns the Map of all the conflicting pid and their item values
|
||||
*
|
||||
* @param pid:
|
||||
* the property having conflicts-with constraint
|
||||
* @return
|
||||
*/
|
||||
@Override
|
||||
public Map<PropertyIdValue, List<Value>> getParamConflictsWith(PropertyIdValue pid) {
|
||||
List<Statement> statementList = getConstraintsByType(pid, CONFLICTS_WITH_CONSTRAINT_QID).collect(Collectors.toList());
|
||||
Map<PropertyIdValue, List<Value>> propertyIdValueListMap = new HashMap<>();
|
||||
for (Statement statement : statementList) {
|
||||
List<SnakGroup> specs = statement.getClaim().getQualifiers();
|
||||
PropertyIdValue conflictingPid = null;
|
||||
List<Value> items = new ArrayList<>();
|
||||
for(SnakGroup group : specs) {
|
||||
for (Snak snak : group.getSnaks()) {
|
||||
if (group.getProperty().getId().equals(CONFLICTS_WITH_PROPERTY_PID)){
|
||||
conflictingPid = (PropertyIdValue) snak.getValue();
|
||||
}
|
||||
if (group.getProperty().getId().equals(ITEM_OF_PROPERTY_CONSTRAINT_PID)){
|
||||
items.add(snak.getValue());
|
||||
}
|
||||
}
|
||||
}
|
||||
if (conflictingPid != null) {
|
||||
propertyIdValueListMap.put(conflictingPid, items);
|
||||
}
|
||||
}
|
||||
|
||||
return propertyIdValueListMap;
|
||||
}
|
||||
}
|
||||
|
@ -3,18 +3,47 @@ package org.openrefine.wikidata.qa.scrutinizers;
|
||||
import org.openrefine.wikidata.qa.QAWarning;
|
||||
import org.openrefine.wikidata.updates.ItemUpdate;
|
||||
import org.wikidata.wdtk.datamodel.interfaces.PropertyIdValue;
|
||||
import org.wikidata.wdtk.datamodel.interfaces.Snak;
|
||||
import org.wikidata.wdtk.datamodel.interfaces.SnakGroup;
|
||||
import org.wikidata.wdtk.datamodel.interfaces.Statement;
|
||||
import org.wikidata.wdtk.datamodel.interfaces.Value;
|
||||
|
||||
import java.util.Set;
|
||||
import java.util.Map;
|
||||
import java.util.ArrayList;
|
||||
import java.util.HashMap;
|
||||
import java.util.HashSet;
|
||||
import java.util.List;
|
||||
import java.util.Map;
|
||||
import java.util.Set;
|
||||
import java.util.stream.Collectors;
|
||||
|
||||
public class ConflictsWithScrutinizer extends EditScrutinizer {
|
||||
|
||||
public static final String type = "having-conflicts-with-statements";
|
||||
public static String CONFLICTS_WITH_CONSTRAINT_QID = "Q21502838";
|
||||
public static String CONFLICTS_WITH_PROPERTY_PID = "P2306";
|
||||
public static String ITEM_OF_PROPERTY_CONSTRAINT_PID = "P2305";
|
||||
|
||||
class ConflictsWithConstraint {
|
||||
final PropertyIdValue conflictingPid;
|
||||
final List<Value> itemList;
|
||||
|
||||
ConflictsWithConstraint(Statement statement) {
|
||||
List<SnakGroup> specs = statement.getClaim().getQualifiers();
|
||||
PropertyIdValue pid = null;
|
||||
this.itemList = new ArrayList<>();
|
||||
for(SnakGroup group : specs) {
|
||||
for (Snak snak : group.getSnaks()) {
|
||||
if (group.getProperty().getId().equals(CONFLICTS_WITH_PROPERTY_PID)){
|
||||
pid = (PropertyIdValue) snak.getValue();
|
||||
}
|
||||
if (group.getProperty().getId().equals(ITEM_OF_PROPERTY_CONSTRAINT_PID)){
|
||||
this.itemList.add(snak.getValue());
|
||||
}
|
||||
}
|
||||
}
|
||||
this.conflictingPid = pid;
|
||||
}
|
||||
}
|
||||
|
||||
@Override
|
||||
public void scrutinize(ItemUpdate update) {
|
||||
@ -36,9 +65,12 @@ public class ConflictsWithScrutinizer extends EditScrutinizer {
|
||||
}
|
||||
|
||||
for(PropertyIdValue propertyId : propertyIdValueValueMap.keySet()){
|
||||
Map<PropertyIdValue, List<Value>> conflictingPropertyMap = _fetcher.getParamConflictsWith(propertyId);
|
||||
for (PropertyIdValue conflictingPid : conflictingPropertyMap.keySet()) {
|
||||
if (propertyIdValueValueMap.containsKey(conflictingPid) && raiseWarning(propertyIdValueValueMap, conflictingPid, conflictingPropertyMap)) {
|
||||
List<Statement> statementList = _fetcher.getConstraintsByType(propertyId, CONFLICTS_WITH_CONSTRAINT_QID).collect(Collectors.toList());
|
||||
for (Statement statement : statementList) {
|
||||
ConflictsWithConstraint constraint = new ConflictsWithConstraint(statement);
|
||||
PropertyIdValue conflictingPid = constraint.conflictingPid;
|
||||
List<Value> itemList = constraint.itemList;
|
||||
if (propertyIdValueValueMap.containsKey(conflictingPid) && raiseWarning(propertyIdValueValueMap, conflictingPid, itemList)) {
|
||||
QAWarning issue = new QAWarning(type, propertyId.getId()+conflictingPid.getId(), QAWarning.Severity.WARNING, 1);
|
||||
issue.setProperty("property_entity", propertyId);
|
||||
issue.setProperty("added_property_entity", conflictingPid);
|
||||
@ -46,15 +78,16 @@ public class ConflictsWithScrutinizer extends EditScrutinizer {
|
||||
addIssue(issue);
|
||||
}
|
||||
}
|
||||
|
||||
}
|
||||
}
|
||||
|
||||
private boolean raiseWarning(Map<PropertyIdValue, Set<Value>> propertyIdValueValueMap, PropertyIdValue conflictingPid, Map<PropertyIdValue, List<Value>> conflictingPropertyMap) {
|
||||
if (conflictingPropertyMap.get(conflictingPid).isEmpty()){
|
||||
private boolean raiseWarning(Map<PropertyIdValue, Set<Value>> propertyIdValueValueMap, PropertyIdValue conflictingPid, List<Value> itemList) {
|
||||
if (itemList.isEmpty()){
|
||||
return true;
|
||||
}
|
||||
|
||||
for (Value value : conflictingPropertyMap.get(conflictingPid)) {
|
||||
for (Value value : itemList) {
|
||||
if (propertyIdValueValueMap.get(conflictingPid).contains(value)){
|
||||
return true;
|
||||
}
|
||||
|
@ -24,19 +24,25 @@
|
||||
package org.openrefine.wikidata.qa;
|
||||
|
||||
import org.wikidata.wdtk.datamodel.helpers.Datamodel;
|
||||
import org.wikidata.wdtk.datamodel.interfaces.Claim;
|
||||
import org.wikidata.wdtk.datamodel.interfaces.EntityIdValue;
|
||||
import org.wikidata.wdtk.datamodel.interfaces.ItemIdValue;
|
||||
import org.wikidata.wdtk.datamodel.interfaces.PropertyIdValue;
|
||||
import org.wikidata.wdtk.datamodel.interfaces.QuantityValue;
|
||||
import org.wikidata.wdtk.datamodel.interfaces.Reference;
|
||||
import org.wikidata.wdtk.datamodel.interfaces.Snak;
|
||||
import org.wikidata.wdtk.datamodel.interfaces.SnakGroup;
|
||||
import org.wikidata.wdtk.datamodel.interfaces.Statement;
|
||||
import org.wikidata.wdtk.datamodel.interfaces.StatementRank;
|
||||
import org.wikidata.wdtk.datamodel.interfaces.Value;
|
||||
|
||||
import java.math.BigDecimal;
|
||||
import java.util.Arrays;
|
||||
import java.util.Collections;
|
||||
import java.util.Set;
|
||||
import java.util.Map;
|
||||
import java.util.HashMap;
|
||||
import java.util.List;
|
||||
import java.util.Set;
|
||||
import java.util.stream.Collectors;
|
||||
import java.util.stream.Stream;
|
||||
|
||||
public class MockConstraintFetcher implements ConstraintFetcher {
|
||||
|
||||
@ -211,10 +217,36 @@ public class MockConstraintFetcher implements ConstraintFetcher {
|
||||
return true;
|
||||
}
|
||||
|
||||
public Map<PropertyIdValue, List<Value>> getParamConflictsWith(PropertyIdValue pid) {
|
||||
Map<PropertyIdValue, List<Value>> propertyIdValueListMap = new HashMap<>();
|
||||
List<Value> items = Arrays.asList(conflictingStatementValue, null);
|
||||
propertyIdValueListMap.put(conflictingStatementPid, items);
|
||||
return propertyIdValueListMap;
|
||||
@Override
|
||||
public Stream<Statement> getConstraintsByType(PropertyIdValue pid, String qid) {
|
||||
EntityIdValue entityIdValue = Datamodel.makeWikidataItemIdValue("Q21502838");
|
||||
PropertyIdValue propertyIdValue = Datamodel.makeWikidataPropertyIdValue("P2302");
|
||||
Snak snak = Datamodel.makeValueSnak(propertyIdValue,entityIdValue);
|
||||
|
||||
PropertyIdValue property = Datamodel.makeWikidataPropertyIdValue("P2306");
|
||||
Value propertyValue = Datamodel.makeWikidataPropertyIdValue("P31");
|
||||
Snak snak1 = Datamodel.makeValueSnak(property, propertyValue);
|
||||
List<Snak> group1 = Collections.singletonList(snak1);
|
||||
|
||||
PropertyIdValue item = Datamodel.makeWikidataPropertyIdValue("P2305");
|
||||
Value itemValue = Datamodel.makeWikidataItemIdValue("Q5");
|
||||
Snak snak2 = Datamodel.makeValueSnak(item, itemValue);
|
||||
List<Snak> group2 = Collections.singletonList(snak2);
|
||||
|
||||
SnakGroup snakGroup1 = Datamodel.makeSnakGroup(group1);
|
||||
SnakGroup snakGroup2 = Datamodel.makeSnakGroup(group2);
|
||||
|
||||
List<SnakGroup> listSnakGroup = Arrays.asList(snakGroup1, snakGroup2);
|
||||
Claim claim = Datamodel.makeClaim(entityIdValue, snak, listSnakGroup);
|
||||
|
||||
Reference reference = Datamodel.makeReference(listSnakGroup);
|
||||
List<Reference> referenceList = Collections.singletonList(reference);
|
||||
|
||||
Statement statement = Datamodel.makeStatement(claim, referenceList, StatementRank.NORMAL, "P2302$77BD7FE4-C051-4776-855C-543F0CE697D0");
|
||||
List<Statement> statements = Collections.singletonList(statement);
|
||||
|
||||
return statements.stream()
|
||||
.filter(s -> s.getValue() != null && ((EntityIdValue) s.getValue()).getId().equals(qid))
|
||||
.filter(s -> !StatementRank.DEPRECATED.equals(s.getRank()));
|
||||
}
|
||||
}
|
||||
|
Loading…
Reference in New Issue
Block a user