installation on poleng computer, clean up

This commit is contained in:
rjawor 2018-08-29 12:56:47 +02:00
parent 8e1d2d2c42
commit 7d3fa9e2ae
6 changed files with 18 additions and 14 deletions

3
.gitignore vendored
View File

@ -1,6 +1,7 @@
build/
logs/concordia-server.log
logs/pgbouncer.log
pgbouncer.log
logs/phrase-searches.json
concordia.cfg
concordia-server/config.hpp
@ -40,3 +41,5 @@ import-requests/request_handler.pid
mgiza-aligner/corpus-compilator/corpora
mgiza-aligner/corpus-compilator/dictionaries/*lem
mgiza-aligner/corpus-compilator/dictionary-compilator/*.tsv
mgiza-aligner/mgiza/mgizapp/inst/
mgiza-aligner/mgiza/mgizapp/install_manifest.txt

View File

@ -6,7 +6,7 @@
- grant all privileges on database concordia_server to concordia;
- sudo vim /etc/postgresql/9.3/main/pg_hba.conf: change "local all all peer" to "local all all md5"
- pgbouncer:
- sudo apt-get install autoconf automake m4 libtool pkg-config libevent-dev autogen
- sudo apt-get install autoconf automake m4 libtool pkg-config libevent-dev autogen python-docutils
$ git clone https://github.com/pgbouncer/pgbouncer.git
$ cd pgbouncer
$ git submodule init

View File

@ -1,10 +1,10 @@
dir@#@europarl_sample
concordia_host@#@localhost
concordia_port@#@8800
tmid@#@1
desc@#@Europarl sample (1000 sentences)
enjoy@#@Życzymy udanej pracy z systemem!
prompt@#@Wprowadź zdanie (po polsku):
suggestion@#@Na każde państwo członkowskie Unii Europejskiej przypada jeden komisarz.
suggestion@#@Komisja Europejska przygotowuje raport na najbliższym posiedzeniu.
suggestion@#@Wspólny Komitet przyjmuje swój statut.
tmid@#@2
desc@#@Welcome to the interactive Concordia demo. The system finds the longest matches of the pattern sentence in its translation memory. This translation memory is over 1.5M sentences taken from English-Polish corpus of European Law (Europarl + JRC-Acquis). Please enter an English sentence in the field below and press Enter (or use the search button). This instance of Concordia works best with law sentences, but is very likely to output some results for any English sentence. You can also use predefined samples, simply use the link "show/hide samples" and apply one of the sample sentences. After the search, click on the highlighted fragments to see their context.
enjoy@#@Enjoy your work with the system!
prompt@#@Enter search pattern (English sentence):
suggestion@#@Every ship in the European Union must have a crew of 50 or more workers.
suggestion@#@It is impossible to abolish the customs duties on fruit and vegetables.
suggestion@#@The convention on human rights was held in Geneva.

View File

@ -0,0 +1 @@
../versions_available/europarl_sample.cfg

View File

@ -1,9 +1,9 @@
SRC_LANG=pl
TRG_LANG=en
SRC_LANG=en
TRG_LANG=pl
CORPUS_NAME=europarl_sample
SEPARATOR=@\#@
DICTIONARY_WEIGHT=0
DICTIONARY_WEIGHT=3
all: corpora/$(CORPUS_NAME)/aligned_final.txt corpora/$(CORPUS_NAME)/src_final.txt corpora/$(CORPUS_NAME)/trg_final.txt

View File

@ -1,7 +1,7 @@
#!/bin/sh
CORPUS_NAME="stocznia_plen"
SRC_LANG_ID=1
TRG_LANG_ID=2
CORPUS_NAME="europarl_sample"
SRC_LANG_ID=2
TRG_LANG_ID=1
./addAlignedLemmatizedTM.py $CORPUS_NAME ../mgiza-aligner/corpora/$CORPUS_NAME/src_final.txt $SRC_LANG_ID ../mgiza-aligner/corpora/$CORPUS_NAME/trg_final.txt $TRG_LANG_ID ../mgiza-aligner/corpora/$CORPUS_NAME/aligned_final.txt