Add option to include raw templates as cells
This commit is contained in:
parent
554b75fa7b
commit
0a00fd9318
@ -19,6 +19,9 @@ import org.sweble.wikitext.parser.nodes.WtItalics;
|
|||||||
import org.sweble.wikitext.parser.nodes.WtNewline;
|
import org.sweble.wikitext.parser.nodes.WtNewline;
|
||||||
import org.sweble.wikitext.parser.nodes.WtNode;
|
import org.sweble.wikitext.parser.nodes.WtNode;
|
||||||
import org.sweble.wikitext.parser.nodes.WtSection;
|
import org.sweble.wikitext.parser.nodes.WtSection;
|
||||||
|
import org.sweble.wikitext.parser.nodes.WtTemplate;
|
||||||
|
import org.sweble.wikitext.parser.nodes.WtTemplateArgument;
|
||||||
|
import org.sweble.wikitext.parser.nodes.WtTemplateArguments;
|
||||||
import org.sweble.wikitext.parser.nodes.WtText;
|
import org.sweble.wikitext.parser.nodes.WtText;
|
||||||
import org.sweble.wikitext.parser.nodes.WtInternalLink;
|
import org.sweble.wikitext.parser.nodes.WtInternalLink;
|
||||||
import org.sweble.wikitext.parser.nodes.WtExternalLink;
|
import org.sweble.wikitext.parser.nodes.WtExternalLink;
|
||||||
@ -77,6 +80,7 @@ public class WikitextImporter extends TabularImportingParserBase {
|
|||||||
|
|
||||||
JSONUtilities.safePut(options, "guessCellValueTypes", false);
|
JSONUtilities.safePut(options, "guessCellValueTypes", false);
|
||||||
JSONUtilities.safePut(options, "blankSpanningCells", true);
|
JSONUtilities.safePut(options, "blankSpanningCells", true);
|
||||||
|
JSONUtilities.safePut(options, "includeRawTemplates", false);
|
||||||
JSONUtilities.safePut(options, "wikiUrl", "https://en.wikipedia.org/wiki/");
|
JSONUtilities.safePut(options, "wikiUrl", "https://en.wikipedia.org/wiki/");
|
||||||
|
|
||||||
return options;
|
return options;
|
||||||
@ -125,6 +129,7 @@ public class WikitextImporter extends TabularImportingParserBase {
|
|||||||
private List<String> currentRow;
|
private List<String> currentRow;
|
||||||
|
|
||||||
private boolean blankSpanningCells;
|
private boolean blankSpanningCells;
|
||||||
|
private boolean includeRawTemplates;
|
||||||
|
|
||||||
private int rowId;
|
private int rowId;
|
||||||
private List<SpanningCell> spanningCells;
|
private List<SpanningCell> spanningCells;
|
||||||
@ -138,8 +143,9 @@ public class WikitextImporter extends TabularImportingParserBase {
|
|||||||
private int spanningCellIdx;
|
private int spanningCellIdx;
|
||||||
private List<String> internalLinksInCell;
|
private List<String> internalLinksInCell;
|
||||||
|
|
||||||
public WikitextTableVisitor(boolean blankSpanningCells) {
|
public WikitextTableVisitor(boolean blankSpanningCells, boolean includeRawTemplates) {
|
||||||
this.blankSpanningCells = blankSpanningCells;
|
this.blankSpanningCells = blankSpanningCells;
|
||||||
|
this.includeRawTemplates = includeRawTemplates;
|
||||||
caption = null;
|
caption = null;
|
||||||
header = new ArrayList<String>();
|
header = new ArrayList<String>();
|
||||||
rows = new ArrayList<List<String>>();
|
rows = new ArrayList<List<String>>();
|
||||||
@ -165,7 +171,7 @@ public class WikitextImporter extends TabularImportingParserBase {
|
|||||||
|
|
||||||
public void visit(WtNode e) {
|
public void visit(WtNode e) {
|
||||||
// Ignore other nodes
|
// Ignore other nodes
|
||||||
// System.out.println(e.getNodeName());
|
System.out.println(e.getNodeName());
|
||||||
}
|
}
|
||||||
|
|
||||||
/* Table handling */
|
/* Table handling */
|
||||||
@ -343,7 +349,11 @@ public class WikitextImporter extends TabularImportingParserBase {
|
|||||||
}
|
}
|
||||||
|
|
||||||
public void visit(WtName e) {
|
public void visit(WtName e) {
|
||||||
|
try {
|
||||||
currentXmlAttr = e.getAsString();
|
currentXmlAttr = e.getAsString();
|
||||||
|
} catch (UnsupportedOperationException _) {
|
||||||
|
currentXmlAttr = null;
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
public void visit(WtValue e) {
|
public void visit(WtValue e) {
|
||||||
@ -352,7 +362,6 @@ public class WikitextImporter extends TabularImportingParserBase {
|
|||||||
|
|
||||||
/* Link management */
|
/* Link management */
|
||||||
|
|
||||||
|
|
||||||
public void visit(WtInternalLink e) {
|
public void visit(WtInternalLink e) {
|
||||||
currentInternalLink = e.getTarget().getAsString();
|
currentInternalLink = e.getTarget().getAsString();
|
||||||
internalLinksInCell.add(currentInternalLink);
|
internalLinksInCell.add(currentInternalLink);
|
||||||
@ -396,6 +405,29 @@ public class WikitextImporter extends TabularImportingParserBase {
|
|||||||
// already handled, in WtExternalLink, added here for clarity
|
// already handled, in WtExternalLink, added here for clarity
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/* Templates */
|
||||||
|
|
||||||
|
public void visit(WtTemplate e) {
|
||||||
|
if (includeRawTemplates) {
|
||||||
|
writeText("{{"+e.getName().getAsString());
|
||||||
|
WtTemplateArguments args = e.getArgs();
|
||||||
|
for (int i = 0; i != args.size(); i++) {
|
||||||
|
writeText("|");
|
||||||
|
iterate(args.get(i));
|
||||||
|
}
|
||||||
|
writeText("}}");
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
public void visit(WtTemplateArgument e) {
|
||||||
|
writeText("|");
|
||||||
|
if(e.hasName()) {
|
||||||
|
writeText(e.getName().getAsString());
|
||||||
|
writeText("=");
|
||||||
|
}
|
||||||
|
iterate(e.getValue());
|
||||||
|
}
|
||||||
|
|
||||||
/* Content blocks */
|
/* Content blocks */
|
||||||
|
|
||||||
public void visit(WtParsedWikitextPage e) {
|
public void visit(WtParsedWikitextPage e) {
|
||||||
@ -546,7 +578,8 @@ public class WikitextImporter extends TabularImportingParserBase {
|
|||||||
|
|
||||||
// Compile the retrieved page
|
// Compile the retrieved page
|
||||||
boolean blankSpanningCells = JSONUtilities.getBoolean(options, "blankSpanningCells", true);
|
boolean blankSpanningCells = JSONUtilities.getBoolean(options, "blankSpanningCells", true);
|
||||||
final WikitextTableVisitor vs = new WikitextTableVisitor(blankSpanningCells);
|
boolean includeRawTemplates = JSONUtilities.getBoolean(options, "includeRawTemplates", false);
|
||||||
|
final WikitextTableVisitor vs = new WikitextTableVisitor(blankSpanningCells, includeRawTemplates);
|
||||||
vs.go(parsedArticle);
|
vs.go(parsedArticle);
|
||||||
|
|
||||||
WikiTableDataReader dataReader = new WikiTableDataReader(vs);
|
WikiTableDataReader dataReader = new WikiTableDataReader(vs);
|
||||||
|
@ -114,6 +114,7 @@
|
|||||||
"store-blank": "Store blank rows",
|
"store-blank": "Store blank rows",
|
||||||
"store-nulls": "Store blank cells as nulls",
|
"store-nulls": "Store blank cells as nulls",
|
||||||
"blank-spanning-cells": "Pad cells spanning over multiple rows or columns with nulls",
|
"blank-spanning-cells": "Pad cells spanning over multiple rows or columns with nulls",
|
||||||
|
"include-raw-templates": "Include raw templates as wikicode",
|
||||||
"wiki-base-url": "Reconcile to wiki with base URL:",
|
"wiki-base-url": "Reconcile to wiki with base URL:",
|
||||||
"invalid-wikitext": "No table could be parsed. Are you sure this is a valid wiki table?",
|
"invalid-wikitext": "No table could be parsed. Are you sure this is a valid wiki table?",
|
||||||
"store-source": "Store file source <br/>(file names, URLs)<br/>in each row",
|
"store-source": "Store file source <br/>(file names, URLs)<br/>in each row",
|
||||||
|
@ -13,6 +13,8 @@
|
|||||||
<td><label for="$blank-spanning-cells" id="or-import-blankSpanningCells"></label></td></tr>
|
<td><label for="$blank-spanning-cells" id="or-import-blankSpanningCells"></label></td></tr>
|
||||||
<tr><td width="1%"><input type="checkbox" bind="storeBlankRowsCheckbox" id="$store-blank-rows" /></td>
|
<tr><td width="1%"><input type="checkbox" bind="storeBlankRowsCheckbox" id="$store-blank-rows" /></td>
|
||||||
<td colspan="2"><label for="$store-blank-rows" id="or-import-blank"></label></td></tr>
|
<td colspan="2"><label for="$store-blank-rows" id="or-import-blank"></label></td></tr>
|
||||||
|
<tr><td width="1%"><input type="checkbox" bind="includeRawTemplatesCheckbox" id="$include-raw-templates" /></td>
|
||||||
|
<td colspan="2"><label for="$include-raw-templates" id="or-import-includeRawTemplates"></label></td></tr>
|
||||||
|
|
||||||
<tr><td width="1%"><input type="checkbox" bind="storeBlankCellsAsNullsCheckbox" id="$store-blank-cells" /></td>
|
<tr><td width="1%"><input type="checkbox" bind="storeBlankCellsAsNullsCheckbox" id="$store-blank-cells" /></td>
|
||||||
<td colspan="2"><label for="$store-blank-cells" id="or-import-null"></label></td></tr>
|
<td colspan="2"><label for="$store-blank-cells" id="or-import-null"></label></td></tr>
|
||||||
|
@ -87,6 +87,7 @@ Refine.WikitextParserUI.prototype.getOptions = function() {
|
|||||||
}
|
}
|
||||||
options.storeBlankRows = this._optionContainerElmts.storeBlankRowsCheckbox[0].checked;
|
options.storeBlankRows = this._optionContainerElmts.storeBlankRowsCheckbox[0].checked;
|
||||||
options.blankSpanningCells = this._optionContainerElmts.blankSpanningCellsCheckbox[0].checked;
|
options.blankSpanningCells = this._optionContainerElmts.blankSpanningCellsCheckbox[0].checked;
|
||||||
|
options.includeRawTemplates = this._optionContainerElmts.includeRawTemplatesCheckbox[0].checked;
|
||||||
|
|
||||||
options.guessCellValueTypes = this._optionContainerElmts.guessCellValueTypesCheckbox[0].checked;
|
options.guessCellValueTypes = this._optionContainerElmts.guessCellValueTypesCheckbox[0].checked;
|
||||||
|
|
||||||
@ -113,6 +114,7 @@ Refine.WikitextParserUI.prototype._initialize = function() {
|
|||||||
$('#or-import-rows2').text($.i18n._('core-index-parser')["rows-data"]);
|
$('#or-import-rows2').text($.i18n._('core-index-parser')["rows-data"]);
|
||||||
$('#or-import-parseCell').html($.i18n._('core-index-parser')["parse-cell"]);
|
$('#or-import-parseCell').html($.i18n._('core-index-parser')["parse-cell"]);
|
||||||
$('#or-import-blankSpanningCells').text($.i18n._('core-index-parser')["blank-spanning-cells"]);
|
$('#or-import-blankSpanningCells').text($.i18n._('core-index-parser')["blank-spanning-cells"]);
|
||||||
|
$('#or-import-includeRawTemplates').text($.i18n._('core-index-parser')["include-raw-templates"]);
|
||||||
$('#or-import-blank').text($.i18n._('core-index-parser')["store-blank"]);
|
$('#or-import-blank').text($.i18n._('core-index-parser')["store-blank"]);
|
||||||
$('#or-import-null').text($.i18n._('core-index-parser')["store-nulls"]);
|
$('#or-import-null').text($.i18n._('core-index-parser')["store-nulls"]);
|
||||||
$('#or-import-source').html($.i18n._('core-index-parser')["store-source"]);
|
$('#or-import-source').html($.i18n._('core-index-parser')["store-source"]);
|
||||||
@ -142,6 +144,10 @@ Refine.WikitextParserUI.prototype._initialize = function() {
|
|||||||
this._optionContainerElmts.blankSpanningCellsCheckbox.prop("checked", true);
|
this._optionContainerElmts.blankSpanningCellsCheckbox.prop("checked", true);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
if (this._config.includeRawTemplates) {
|
||||||
|
this._optionContainerElmts.includeRawTemplatesCheckbox.prop("checked", true);
|
||||||
|
}
|
||||||
|
|
||||||
if (this._config.storeBlankRows) {
|
if (this._config.storeBlankRows) {
|
||||||
this._optionContainerElmts.storeBlankRowsCheckbox.prop("checked", true);
|
this._optionContainerElmts.storeBlankRowsCheckbox.prop("checked", true);
|
||||||
}
|
}
|
||||||
|
Loading…
Reference in New Issue
Block a user