installation on poleng computer, clean up

This commit is contained in:
rjawor 2018-08-29 12:56:47 +02:00
parent 8e1d2d2c42
commit 7d3fa9e2ae
6 changed files with 18 additions and 14 deletions

3
.gitignore vendored
View File

@ -1,6 +1,7 @@
build/ build/
logs/concordia-server.log logs/concordia-server.log
logs/pgbouncer.log logs/pgbouncer.log
pgbouncer.log
logs/phrase-searches.json logs/phrase-searches.json
concordia.cfg concordia.cfg
concordia-server/config.hpp concordia-server/config.hpp
@ -40,3 +41,5 @@ import-requests/request_handler.pid
mgiza-aligner/corpus-compilator/corpora mgiza-aligner/corpus-compilator/corpora
mgiza-aligner/corpus-compilator/dictionaries/*lem mgiza-aligner/corpus-compilator/dictionaries/*lem
mgiza-aligner/corpus-compilator/dictionary-compilator/*.tsv mgiza-aligner/corpus-compilator/dictionary-compilator/*.tsv
mgiza-aligner/mgiza/mgizapp/inst/
mgiza-aligner/mgiza/mgizapp/install_manifest.txt

View File

@ -6,7 +6,7 @@
- grant all privileges on database concordia_server to concordia; - grant all privileges on database concordia_server to concordia;
- sudo vim /etc/postgresql/9.3/main/pg_hba.conf: change "local all all peer" to "local all all md5" - sudo vim /etc/postgresql/9.3/main/pg_hba.conf: change "local all all peer" to "local all all md5"
- pgbouncer: - pgbouncer:
- sudo apt-get install autoconf automake m4 libtool pkg-config libevent-dev autogen - sudo apt-get install autoconf automake m4 libtool pkg-config libevent-dev autogen python-docutils
$ git clone https://github.com/pgbouncer/pgbouncer.git $ git clone https://github.com/pgbouncer/pgbouncer.git
$ cd pgbouncer $ cd pgbouncer
$ git submodule init $ git submodule init

View File

@ -1,10 +1,10 @@
dir@#@europarl_sample dir@#@europarl_sample
concordia_host@#@localhost concordia_host@#@localhost
concordia_port@#@8800 concordia_port@#@8800
tmid@#@1 tmid@#@2
desc@#@Europarl sample (1000 sentences) desc@#@Welcome to the interactive Concordia demo. The system finds the longest matches of the pattern sentence in its translation memory. This translation memory is over 1.5M sentences taken from English-Polish corpus of European Law (Europarl + JRC-Acquis). Please enter an English sentence in the field below and press Enter (or use the search button). This instance of Concordia works best with law sentences, but is very likely to output some results for any English sentence. You can also use predefined samples, simply use the link "show/hide samples" and apply one of the sample sentences. After the search, click on the highlighted fragments to see their context.
enjoy@#@Życzymy udanej pracy z systemem! enjoy@#@Enjoy your work with the system!
prompt@#@Wprowadź zdanie (po polsku): prompt@#@Enter search pattern (English sentence):
suggestion@#@Na każde państwo członkowskie Unii Europejskiej przypada jeden komisarz. suggestion@#@Every ship in the European Union must have a crew of 50 or more workers.
suggestion@#@Komisja Europejska przygotowuje raport na najbliższym posiedzeniu. suggestion@#@It is impossible to abolish the customs duties on fruit and vegetables.
suggestion@#@Wspólny Komitet przyjmuje swój statut. suggestion@#@The convention on human rights was held in Geneva.

View File

@ -0,0 +1 @@
../versions_available/europarl_sample.cfg

View File

@ -1,9 +1,9 @@
SRC_LANG=pl SRC_LANG=en
TRG_LANG=en TRG_LANG=pl
CORPUS_NAME=europarl_sample CORPUS_NAME=europarl_sample
SEPARATOR=@\#@ SEPARATOR=@\#@
DICTIONARY_WEIGHT=0 DICTIONARY_WEIGHT=3
all: corpora/$(CORPUS_NAME)/aligned_final.txt corpora/$(CORPUS_NAME)/src_final.txt corpora/$(CORPUS_NAME)/trg_final.txt all: corpora/$(CORPUS_NAME)/aligned_final.txt corpora/$(CORPUS_NAME)/src_final.txt corpora/$(CORPUS_NAME)/trg_final.txt

View File

@ -1,7 +1,7 @@
#!/bin/sh #!/bin/sh
CORPUS_NAME="stocznia_plen" CORPUS_NAME="europarl_sample"
SRC_LANG_ID=1 SRC_LANG_ID=2
TRG_LANG_ID=2 TRG_LANG_ID=1
./addAlignedLemmatizedTM.py $CORPUS_NAME ../mgiza-aligner/corpora/$CORPUS_NAME/src_final.txt $SRC_LANG_ID ../mgiza-aligner/corpora/$CORPUS_NAME/trg_final.txt $TRG_LANG_ID ../mgiza-aligner/corpora/$CORPUS_NAME/aligned_final.txt ./addAlignedLemmatizedTM.py $CORPUS_NAME ../mgiza-aligner/corpora/$CORPUS_NAME/src_final.txt $SRC_LANG_ID ../mgiza-aligner/corpora/$CORPUS_NAME/trg_final.txt $TRG_LANG_ID ../mgiza-aligner/corpora/$CORPUS_NAME/aligned_final.txt