Add option to include raw templates as cells

This commit is contained in:
Antonin Delpeuch 2017-08-25 14:28:30 +01:00
parent 554b75fa7b
commit 0a00fd9318
4 changed files with 47 additions and 5 deletions

View File

@ -19,6 +19,9 @@ import org.sweble.wikitext.parser.nodes.WtItalics;
import org.sweble.wikitext.parser.nodes.WtNewline; import org.sweble.wikitext.parser.nodes.WtNewline;
import org.sweble.wikitext.parser.nodes.WtNode; import org.sweble.wikitext.parser.nodes.WtNode;
import org.sweble.wikitext.parser.nodes.WtSection; import org.sweble.wikitext.parser.nodes.WtSection;
import org.sweble.wikitext.parser.nodes.WtTemplate;
import org.sweble.wikitext.parser.nodes.WtTemplateArgument;
import org.sweble.wikitext.parser.nodes.WtTemplateArguments;
import org.sweble.wikitext.parser.nodes.WtText; import org.sweble.wikitext.parser.nodes.WtText;
import org.sweble.wikitext.parser.nodes.WtInternalLink; import org.sweble.wikitext.parser.nodes.WtInternalLink;
import org.sweble.wikitext.parser.nodes.WtExternalLink; import org.sweble.wikitext.parser.nodes.WtExternalLink;
@ -77,6 +80,7 @@ public class WikitextImporter extends TabularImportingParserBase {
JSONUtilities.safePut(options, "guessCellValueTypes", false); JSONUtilities.safePut(options, "guessCellValueTypes", false);
JSONUtilities.safePut(options, "blankSpanningCells", true); JSONUtilities.safePut(options, "blankSpanningCells", true);
JSONUtilities.safePut(options, "includeRawTemplates", false);
JSONUtilities.safePut(options, "wikiUrl", "https://en.wikipedia.org/wiki/"); JSONUtilities.safePut(options, "wikiUrl", "https://en.wikipedia.org/wiki/");
return options; return options;
@ -125,6 +129,7 @@ public class WikitextImporter extends TabularImportingParserBase {
private List<String> currentRow; private List<String> currentRow;
private boolean blankSpanningCells; private boolean blankSpanningCells;
private boolean includeRawTemplates;
private int rowId; private int rowId;
private List<SpanningCell> spanningCells; private List<SpanningCell> spanningCells;
@ -138,8 +143,9 @@ public class WikitextImporter extends TabularImportingParserBase {
private int spanningCellIdx; private int spanningCellIdx;
private List<String> internalLinksInCell; private List<String> internalLinksInCell;
public WikitextTableVisitor(boolean blankSpanningCells) { public WikitextTableVisitor(boolean blankSpanningCells, boolean includeRawTemplates) {
this.blankSpanningCells = blankSpanningCells; this.blankSpanningCells = blankSpanningCells;
this.includeRawTemplates = includeRawTemplates;
caption = null; caption = null;
header = new ArrayList<String>(); header = new ArrayList<String>();
rows = new ArrayList<List<String>>(); rows = new ArrayList<List<String>>();
@ -165,7 +171,7 @@ public class WikitextImporter extends TabularImportingParserBase {
public void visit(WtNode e) { public void visit(WtNode e) {
// Ignore other nodes // Ignore other nodes
// System.out.println(e.getNodeName()); System.out.println(e.getNodeName());
} }
/* Table handling */ /* Table handling */
@ -343,7 +349,11 @@ public class WikitextImporter extends TabularImportingParserBase {
} }
public void visit(WtName e) { public void visit(WtName e) {
currentXmlAttr = e.getAsString(); try {
currentXmlAttr = e.getAsString();
} catch (UnsupportedOperationException _) {
currentXmlAttr = null;
}
} }
public void visit(WtValue e) { public void visit(WtValue e) {
@ -352,7 +362,6 @@ public class WikitextImporter extends TabularImportingParserBase {
/* Link management */ /* Link management */
public void visit(WtInternalLink e) { public void visit(WtInternalLink e) {
currentInternalLink = e.getTarget().getAsString(); currentInternalLink = e.getTarget().getAsString();
internalLinksInCell.add(currentInternalLink); internalLinksInCell.add(currentInternalLink);
@ -396,6 +405,29 @@ public class WikitextImporter extends TabularImportingParserBase {
// already handled, in WtExternalLink, added here for clarity // already handled, in WtExternalLink, added here for clarity
} }
/* Templates */
public void visit(WtTemplate e) {
if (includeRawTemplates) {
writeText("{{"+e.getName().getAsString());
WtTemplateArguments args = e.getArgs();
for (int i = 0; i != args.size(); i++) {
writeText("|");
iterate(args.get(i));
}
writeText("}}");
}
}
public void visit(WtTemplateArgument e) {
writeText("|");
if(e.hasName()) {
writeText(e.getName().getAsString());
writeText("=");
}
iterate(e.getValue());
}
/* Content blocks */ /* Content blocks */
public void visit(WtParsedWikitextPage e) { public void visit(WtParsedWikitextPage e) {
@ -546,7 +578,8 @@ public class WikitextImporter extends TabularImportingParserBase {
// Compile the retrieved page // Compile the retrieved page
boolean blankSpanningCells = JSONUtilities.getBoolean(options, "blankSpanningCells", true); boolean blankSpanningCells = JSONUtilities.getBoolean(options, "blankSpanningCells", true);
final WikitextTableVisitor vs = new WikitextTableVisitor(blankSpanningCells); boolean includeRawTemplates = JSONUtilities.getBoolean(options, "includeRawTemplates", false);
final WikitextTableVisitor vs = new WikitextTableVisitor(blankSpanningCells, includeRawTemplates);
vs.go(parsedArticle); vs.go(parsedArticle);
WikiTableDataReader dataReader = new WikiTableDataReader(vs); WikiTableDataReader dataReader = new WikiTableDataReader(vs);

View File

@ -114,6 +114,7 @@
"store-blank": "Store blank rows", "store-blank": "Store blank rows",
"store-nulls": "Store blank cells as nulls", "store-nulls": "Store blank cells as nulls",
"blank-spanning-cells": "Pad cells spanning over multiple rows or columns with nulls", "blank-spanning-cells": "Pad cells spanning over multiple rows or columns with nulls",
"include-raw-templates": "Include raw templates as wikicode",
"wiki-base-url": "Reconcile to wiki with base URL:", "wiki-base-url": "Reconcile to wiki with base URL:",
"invalid-wikitext": "No table could be parsed. Are you sure this is a valid wiki table?", "invalid-wikitext": "No table could be parsed. Are you sure this is a valid wiki table?",
"store-source": "Store file source <br/>(file names, URLs)<br/>in each row", "store-source": "Store file source <br/>(file names, URLs)<br/>in each row",

View File

@ -13,6 +13,8 @@
<td><label for="$blank-spanning-cells" id="or-import-blankSpanningCells"></label></td></tr> <td><label for="$blank-spanning-cells" id="or-import-blankSpanningCells"></label></td></tr>
<tr><td width="1%"><input type="checkbox" bind="storeBlankRowsCheckbox" id="$store-blank-rows" /></td> <tr><td width="1%"><input type="checkbox" bind="storeBlankRowsCheckbox" id="$store-blank-rows" /></td>
<td colspan="2"><label for="$store-blank-rows" id="or-import-blank"></label></td></tr> <td colspan="2"><label for="$store-blank-rows" id="or-import-blank"></label></td></tr>
<tr><td width="1%"><input type="checkbox" bind="includeRawTemplatesCheckbox" id="$include-raw-templates" /></td>
<td colspan="2"><label for="$include-raw-templates" id="or-import-includeRawTemplates"></label></td></tr>
<tr><td width="1%"><input type="checkbox" bind="storeBlankCellsAsNullsCheckbox" id="$store-blank-cells" /></td> <tr><td width="1%"><input type="checkbox" bind="storeBlankCellsAsNullsCheckbox" id="$store-blank-cells" /></td>
<td colspan="2"><label for="$store-blank-cells" id="or-import-null"></label></td></tr> <td colspan="2"><label for="$store-blank-cells" id="or-import-null"></label></td></tr>

View File

@ -87,6 +87,7 @@ Refine.WikitextParserUI.prototype.getOptions = function() {
} }
options.storeBlankRows = this._optionContainerElmts.storeBlankRowsCheckbox[0].checked; options.storeBlankRows = this._optionContainerElmts.storeBlankRowsCheckbox[0].checked;
options.blankSpanningCells = this._optionContainerElmts.blankSpanningCellsCheckbox[0].checked; options.blankSpanningCells = this._optionContainerElmts.blankSpanningCellsCheckbox[0].checked;
options.includeRawTemplates = this._optionContainerElmts.includeRawTemplatesCheckbox[0].checked;
options.guessCellValueTypes = this._optionContainerElmts.guessCellValueTypesCheckbox[0].checked; options.guessCellValueTypes = this._optionContainerElmts.guessCellValueTypesCheckbox[0].checked;
@ -113,6 +114,7 @@ Refine.WikitextParserUI.prototype._initialize = function() {
$('#or-import-rows2').text($.i18n._('core-index-parser')["rows-data"]); $('#or-import-rows2').text($.i18n._('core-index-parser')["rows-data"]);
$('#or-import-parseCell').html($.i18n._('core-index-parser')["parse-cell"]); $('#or-import-parseCell').html($.i18n._('core-index-parser')["parse-cell"]);
$('#or-import-blankSpanningCells').text($.i18n._('core-index-parser')["blank-spanning-cells"]); $('#or-import-blankSpanningCells').text($.i18n._('core-index-parser')["blank-spanning-cells"]);
$('#or-import-includeRawTemplates').text($.i18n._('core-index-parser')["include-raw-templates"]);
$('#or-import-blank').text($.i18n._('core-index-parser')["store-blank"]); $('#or-import-blank').text($.i18n._('core-index-parser')["store-blank"]);
$('#or-import-null').text($.i18n._('core-index-parser')["store-nulls"]); $('#or-import-null').text($.i18n._('core-index-parser')["store-nulls"]);
$('#or-import-source').html($.i18n._('core-index-parser')["store-source"]); $('#or-import-source').html($.i18n._('core-index-parser')["store-source"]);
@ -142,6 +144,10 @@ Refine.WikitextParserUI.prototype._initialize = function() {
this._optionContainerElmts.blankSpanningCellsCheckbox.prop("checked", true); this._optionContainerElmts.blankSpanningCellsCheckbox.prop("checked", true);
} }
if (this._config.includeRawTemplates) {
this._optionContainerElmts.includeRawTemplatesCheckbox.prop("checked", true);
}
if (this._config.storeBlankRows) { if (this._config.storeBlankRows) {
this._optionContainerElmts.storeBlankRowsCheckbox.prop("checked", true); this._optionContainerElmts.storeBlankRowsCheckbox.prop("checked", true);
} }