From 01a70fe444cf9a6edfe3e2a473f54145613af3cb Mon Sep 17 00:00:00 2001 From: rjawor Date: Fri, 28 Apr 2017 13:49:30 +0200 Subject: [PATCH] corrected case --- cat/js/cat.js | 12 +++- cat/versions_available/europarl_sample.cfg | 10 +++ cat/versions_enabled/europarl_sample.cfg | 1 + cat/versions_enabled/stocznia_enpl.cfg | 1 - cat/versions_enabled/stocznia_plen.cfg | 1 - concordia-server/index_controller.cpp | 4 +- concordia-server/searcher_controller.cpp | 15 ++-- concordia-server/unit_dao.cpp | 22 ++---- concordia.cfg.in | 18 ++--- mgiza-aligner/Makefile | 72 ++++++++++--------- mgiza-aligner/clean_corpus.py | 24 +++++++ mgiza-aligner/cut.py | 12 ++++ mgiza-aligner/giza.cfg.pattern | 8 +-- mgiza-aligner/paste.py | 15 ++++ resources/anonymizer/named_entities.txt | 3 - .../{anonymizer => tokenizer}/html_tags.txt | 0 resources/tokenizer/named_entities.txt | 5 ++ .../space_symbols.txt | 0 .../stop_symbols.txt | 0 .../{anonymizer => tokenizer}/stop_words.txt | 0 tests/addLemmatizedTM.sh | 8 +-- 21 files changed, 139 insertions(+), 92 deletions(-) create mode 100644 cat/versions_available/europarl_sample.cfg create mode 120000 cat/versions_enabled/europarl_sample.cfg delete mode 120000 cat/versions_enabled/stocznia_enpl.cfg delete mode 120000 cat/versions_enabled/stocznia_plen.cfg create mode 100755 mgiza-aligner/clean_corpus.py create mode 100755 mgiza-aligner/cut.py create mode 100755 mgiza-aligner/paste.py delete mode 100644 resources/anonymizer/named_entities.txt rename resources/{anonymizer => tokenizer}/html_tags.txt (100%) create mode 100644 resources/tokenizer/named_entities.txt rename resources/{anonymizer => tokenizer}/space_symbols.txt (100%) rename resources/{anonymizer => tokenizer}/stop_symbols.txt (100%) rename resources/{anonymizer => tokenizer}/stop_words.txt (100%) diff --git a/cat/js/cat.js b/cat/js/cat.js index 08513ed..eddcde7 100644 --- a/cat/js/cat.js +++ b/cat/js/cat.js @@ -69,10 +69,10 @@ function renderResult(data) { for(var i = 0; i < data['result']['bestOverlay'].length; i++) { var fragment = data['result']['bestOverlay'][i]; //previous unmarked fragment - markedSentence += inputSentence.slice(lastInsertedEnd, fragment['matchedPatternStart']); + markedSentence += htmlEncode(inputSentence.slice(lastInsertedEnd, fragment['matchedPatternStart'])); //the marked fragment - markedSentence += ''+inputSentence.slice(fragment['matchedPatternStart'], fragment['matchedPatternEnd'])+''; + markedSentence += ''+htmlEncode(inputSentence.slice(fragment['matchedPatternStart'], fragment['matchedPatternEnd']))+''; lastInsertedEnd = fragment['matchedPatternEnd']; @@ -80,7 +80,7 @@ function renderResult(data) { } //remaining unmarked fragment - markedSentence += inputSentence.slice(lastInsertedEnd); + markedSentence += htmlEncode(inputSentence.slice(lastInsertedEnd)); res += '
'+markedSentence+'
'; @@ -89,6 +89,12 @@ function renderResult(data) { return res; } +function htmlEncode(value){ + // Create a in-memory div, set its inner text (which jQuery automatically encodes) + // Then grab the encoded contents back out. The div never exists on the page. + return $('
').text(value).html(); +} + function renderFragment(fragment, number) { var result = '