Implementation of UseValuesAsIdentifiers operation and command
This commit is contained in:
parent
ec3e9ab1e9
commit
2a68e761cb
@ -0,0 +1,31 @@
|
||||
package com.google.refine.commands.recon;
|
||||
|
||||
import javax.servlet.http.HttpServletRequest;
|
||||
|
||||
import org.json.JSONObject;
|
||||
|
||||
import com.google.refine.browsing.EngineConfig;
|
||||
import com.google.refine.commands.EngineDependentCommand;
|
||||
import com.google.refine.model.AbstractOperation;
|
||||
import com.google.refine.model.Project;
|
||||
import com.google.refine.model.ReconCandidate;
|
||||
import com.google.refine.model.recon.StandardReconConfig;
|
||||
import com.google.refine.operations.recon.ReconMatchSpecificTopicOperation;
|
||||
import com.google.refine.operations.recon.ReconUseValuesAsIdentifiersOperation;
|
||||
|
||||
public class ReconUseValuesAsIdentifiersCommand extends EngineDependentCommand {
|
||||
@Override
|
||||
protected AbstractOperation createOperation(Project project,
|
||||
HttpServletRequest request, EngineConfig engineConfig) throws Exception {
|
||||
|
||||
String columnName = request.getParameter("columnName");
|
||||
|
||||
return new ReconUseValuesAsIdentifiersOperation(
|
||||
engineConfig,
|
||||
columnName,
|
||||
request.getParameter("service"),
|
||||
request.getParameter("identifierSpace"),
|
||||
request.getParameter("schemaSpace")
|
||||
);
|
||||
}
|
||||
}
|
@ -0,0 +1,157 @@
|
||||
package com.google.refine.operations.recon;
|
||||
|
||||
import java.util.Collections;
|
||||
import java.util.List;
|
||||
import java.util.Properties;
|
||||
|
||||
import org.json.JSONException;
|
||||
import org.json.JSONObject;
|
||||
import org.json.JSONWriter;
|
||||
|
||||
import com.fasterxml.jackson.annotation.JsonIgnore;
|
||||
import com.fasterxml.jackson.annotation.JsonProperty;
|
||||
|
||||
import com.google.refine.browsing.EngineConfig;
|
||||
import com.google.refine.browsing.RowVisitor;
|
||||
import com.google.refine.expr.ExpressionUtils;
|
||||
import com.google.refine.history.Change;
|
||||
import com.google.refine.model.Cell;
|
||||
import com.google.refine.model.Column;
|
||||
import com.google.refine.model.Project;
|
||||
import com.google.refine.model.Recon;
|
||||
import com.google.refine.model.Recon.Judgment;
|
||||
import com.google.refine.model.ReconCandidate;
|
||||
import com.google.refine.model.Row;
|
||||
import com.google.refine.model.changes.CellChange;
|
||||
import com.google.refine.model.changes.ReconChange;
|
||||
import com.google.refine.model.recon.StandardReconConfig;
|
||||
import com.google.refine.operations.EngineDependentMassCellOperation;
|
||||
import com.google.refine.operations.OperationRegistry;
|
||||
|
||||
public class ReconUseValuesAsIdentifiersOperation extends EngineDependentMassCellOperation {
|
||||
|
||||
@JsonProperty("identifierSpace")
|
||||
protected String identifierSpace;
|
||||
@JsonProperty("schemaSpace")
|
||||
protected String schemaSpace;
|
||||
@JsonProperty("service")
|
||||
protected String service;
|
||||
|
||||
@JsonIgnore
|
||||
protected StandardReconConfig reconConfig;
|
||||
|
||||
public ReconUseValuesAsIdentifiersOperation(
|
||||
EngineConfig engineConfig,
|
||||
String columnName,
|
||||
String service,
|
||||
String identifierSpace,
|
||||
String schemaSpace) {
|
||||
super(engineConfig, columnName, false);
|
||||
this.service = service;
|
||||
this.identifierSpace = identifierSpace;
|
||||
this.schemaSpace = schemaSpace;
|
||||
this.reconConfig = new StandardReconConfig(service, identifierSpace, schemaSpace, null, null, true, Collections.emptyList());
|
||||
}
|
||||
|
||||
static public ReconUseValuesAsIdentifiersOperation reconstruct(JSONObject obj) throws Exception {
|
||||
JSONObject engineConfig = obj.getJSONObject("engineConfig");
|
||||
return new ReconUseValuesAsIdentifiersOperation(
|
||||
EngineConfig.reconstruct(engineConfig),
|
||||
obj.getString("columnName"),
|
||||
obj.getString("service"),
|
||||
obj.getString("identifierSpace"),
|
||||
obj.getString("schemaSpace")
|
||||
);
|
||||
}
|
||||
|
||||
@Override
|
||||
public void write(JSONWriter writer, Properties options)
|
||||
throws JSONException {
|
||||
writer.object();
|
||||
writer.key("op"); writer.value(OperationRegistry.s_opClassToName.get(this.getClass()));
|
||||
writer.key("description"); writer.value(getBriefDescription(null));
|
||||
writer.key("engineConfig"); getEngineConfig().write(writer, options);
|
||||
writer.key("columnName"); writer.value(_columnName);
|
||||
writer.key("service"); writer.value(service);
|
||||
writer.key("schemaSpace"); writer.value(schemaSpace);
|
||||
writer.key("identifierSpace"); writer.value(identifierSpace);
|
||||
writer.endObject();
|
||||
}
|
||||
|
||||
@Override
|
||||
public String getBriefDescription(Project project) {
|
||||
return "Use values as reconciliation identifiers in column " + _columnName;
|
||||
}
|
||||
|
||||
@Override
|
||||
protected RowVisitor createRowVisitor(Project project, List<CellChange> cellChanges, long historyEntryID)
|
||||
throws Exception {
|
||||
Column column = project.columnModel.getColumnByName(_columnName);
|
||||
|
||||
return new RowVisitor() {
|
||||
int cellIndex;
|
||||
List<CellChange> cellChanges;
|
||||
long historyEntryID;
|
||||
|
||||
public RowVisitor init(int cellIndex, List<CellChange> cellChanges, long historyEntryID) {
|
||||
this.cellIndex = cellIndex;
|
||||
this.cellChanges = cellChanges;
|
||||
this.historyEntryID = historyEntryID;
|
||||
return this;
|
||||
}
|
||||
|
||||
@Override
|
||||
public void start(Project project) {
|
||||
// nothing to do
|
||||
}
|
||||
|
||||
@Override
|
||||
public void end(Project project) {
|
||||
// nothing to do
|
||||
}
|
||||
|
||||
@Override
|
||||
public boolean visit(Project project, int rowIndex, Row row) {
|
||||
Cell cell = row.getCell(cellIndex);
|
||||
if (cell != null && ExpressionUtils.isNonBlankData(cell.value)) {
|
||||
String id = cell.value.toString();
|
||||
|
||||
ReconCandidate match = new ReconCandidate(id, id, new String[0], 100);
|
||||
Recon newRecon = reconConfig.createNewRecon(historyEntryID);
|
||||
newRecon.match = match;
|
||||
newRecon.candidates = Collections.singletonList(match);
|
||||
newRecon.matchRank = -1;
|
||||
newRecon.judgment = Judgment.Matched;
|
||||
newRecon.judgmentAction = "mass";
|
||||
newRecon.judgmentBatchSize = 1;
|
||||
|
||||
Cell newCell = new Cell(
|
||||
cell.value,
|
||||
newRecon
|
||||
);
|
||||
|
||||
CellChange cellChange = new CellChange(rowIndex, cellIndex, cell, newCell);
|
||||
cellChanges.add(cellChange);
|
||||
}
|
||||
return false;
|
||||
}
|
||||
}.init(column.getCellIndex(), cellChanges, historyEntryID);
|
||||
}
|
||||
|
||||
@Override
|
||||
protected String createDescription(Column column, List<CellChange> cellChanges) {
|
||||
return "Use values as reconciliation identifiers for "+ cellChanges.size() +
|
||||
" cells in column " + column.getName();
|
||||
}
|
||||
|
||||
@Override
|
||||
protected Change createChange(Project project, Column column, List<CellChange> cellChanges) {
|
||||
return new ReconChange(
|
||||
cellChanges,
|
||||
_columnName,
|
||||
reconConfig,
|
||||
null
|
||||
);
|
||||
}
|
||||
|
||||
}
|
@ -127,6 +127,7 @@ function registerCommands() {
|
||||
RS.registerCommand(module, "recon-clear-one-cell", new Packages.com.google.refine.commands.recon.ReconClearOneCellCommand());
|
||||
RS.registerCommand(module, "recon-clear-similar-cells", new Packages.com.google.refine.commands.recon.ReconClearSimilarCellsCommand());
|
||||
RS.registerCommand(module, "recon-copy-across-columns", new Packages.com.google.refine.commands.recon.ReconCopyAcrossColumnsCommand());
|
||||
RS.registerCommand(module, "recon-use-values-as-identifiers", new Packages.com.google.refine.commands.recon.ReconUseValuesAsIdentifiersCommand());
|
||||
RS.registerCommand(module, "preview-extend-data", new Packages.com.google.refine.commands.recon.PreviewExtendDataCommand());
|
||||
RS.registerCommand(module, "extend-data", new Packages.com.google.refine.commands.recon.ExtendDataCommand());
|
||||
|
||||
@ -190,6 +191,7 @@ function registerOperations() {
|
||||
OR.registerOperation(module, "recon-clear-similar-cells", Packages.com.google.refine.operations.recon.ReconClearSimilarCellsOperation);
|
||||
OR.registerOperation(module, "recon-copy-across-columns", Packages.com.google.refine.operations.recon.ReconCopyAcrossColumnsOperation);
|
||||
OR.registerOperation(module, "extend-reconciled-data", Packages.com.google.refine.operations.recon.ExtendDataOperation);
|
||||
OR.registerOperation(module, "recon-use-values-as-identifiers", Packages.com.google.refine.operations.recon.ReconUseValuesAsIdentifiersOperation);
|
||||
}
|
||||
|
||||
function registerImporting() {
|
||||
|
Loading…
Reference in New Issue
Block a user