a6e708f37f
Revert "Replacing old implementation with working implementation"
This reverts commit 1e121f45e2.
Please enter the commit message for your changes. Lines starting
with '#' will be ignored, and an empty message aborts the commit.
Committer: tom <tom@lim.(none)>
On branch master
Changes to be committed:
(use "git reset HEAD <file>..." to unstage)
modified: _old/app/Makefile
deleted: _old/app/conf/Makefile
deleted: _old/app/conf/compiledic.conf
deleted: _old/app/conf/cor.conf
deleted: _old/app/conf/dgc.conf
deleted: _old/app/conf/dgp.conf
deleted: _old/app/conf/gph.conf
deleted: _old/app/conf/grp.conf
deleted: _old/app/conf/gue.conf
deleted: _old/app/conf/kor.conf
deleted: _old/app/conf/lem.conf
deleted: _old/app/conf/mar.conf
deleted: _old/app/conf/ser.conf
deleted: _old/app/conf/utt.conf
modified: _old/app/src/common/Makefile
modified: _old/app/src/compiledic/Makefile
modified: _old/app/src/compiledic/aut2fsa.cc
modified: _old/app/src/cor/Makefile
modified: _old/app/src/dgp/Makefile
new file: _old/app/src/dgp/canonize
new file: _old/app/src/dgp/dgc
modified: _old/app/src/dgp/grammar.hh
modified: _old/app/src/dgp/mgraph.hh
modified: _old/app/src/dgp/sgraph.hh
modified: _old/app/src/dgp/thesymbols.hh
new file: _old/app/src/dgp/tre
modified: _old/app/src/gue/Makefile
modified: _old/app/src/gue/guess.cc
modified: _old/app/src/kor/Makefile
modified: _old/app/src/kor/corlist.cc
modified: _old/app/src/kor/corr.cc
new file: _old/app/src/kor/corr.hh
modified: _old/app/src/kor/main.cc
modified: _old/app/src/lem/Makefile
modified: _old/app/src/lem/lem.cc
modified: _old/app/src/lib/Makefile
modified: _old/app/src/lib/auttools.cc
modified: _old/app/src/lib/symtab.cc
modified: _old/app/src/lib/tft.h
modified: _old/app/src/lib/tfti.h
modified: _old/app/src/lib/ttrans.h
modified: _old/app/src/lib/word.cc
modified: _old/app/src/lib/word.h
modified: _old/app/src/tok.c/Makefile
modified: _old/app/src/tok.c/cmdline_tok.ggo
modified: _old/app/src/tok.c/common_tok.cc
modified: _old/app/src/tok/Makefile
modified: _old/nawszelkiwypadek/tools/aut2fsa
modified: _old/nawszelkiwypadek/tools/cor_dic/makeLabels.pl
modified: _old/nawszelkiwypadek/tools/cor_dic/prep.pl
modified: _old/nawszelkiwypadek/tools/fsm2aut
modified: _old/nawszelkiwypadek/tools/gue_dic/canon.pl
modified: _old/nawszelkiwypadek/tools/gue_dic/compile_user_dict.pl
modified: _old/nawszelkiwypadek/tools/gue_dic/count_prefs.pl
modified: _old/nawszelkiwypadek/tools/gue_dic/cut_prefs.pl
modified: _old/nawszelkiwypadek/tools/gue_dic/makeLabels.pl
modified: _old/nawszelkiwypadek/tools/gue_dic/prep.pl
modified: _old/nawszelkiwypadek/tools/gue_dic/prep_user_dict.pl
modified: _old/nawszelkiwypadek/tools/gue_dic/rmDup.pl
modified: _old/nawszelkiwypadek/tools/gue_dic/stat.pl
modified: _old/nawszelkiwypadek/tools/gue_dic/stat_pre.pl
modified: _old/nawszelkiwypadek/tools/lem_dic/makeLabels.pl
modified: _old/nawszelkiwypadek/tools/lem_dic/prep.pl
modified: auto/defaults
modified: auto/options
modified: auto/output/Makefile
modified: auto/output/config_h
modified: auto/summary
modified: configure
56 lines
1.1 KiB
Perl
Executable File
56 lines
1.1 KiB
Perl
Executable File
#!/usr/bin/perl

# Removes redundant repetitions of paths.
#
# For every run of consecutive input lines that share the same ending (the
# text before the first '~'), only the first MAX_KEPT lines are written to
# STDOUT; the remaining lines of that run are dropped.
#
# The input (the files named on the command line, or STDIN when there are
# none) is assumed to be sorted by ending and then by probability, so the
# lines kept for each ending are the ones that come first in that order.

use strict;
use warnings;
use locale;

# Number of repetitions of one ending that are kept.
#
# The original script carried a disabled usage check suggesting that this
# value was meant to be given on the command line.  It remains a constant,
# because <> treats every command-line argument as the name of an input file.
use constant MAX_KEPT => 10;

# limit_repeats($in, $out, $max)
#
# Copies lines from the filehandle $in to the filehandle $out, keeping at
# most $max lines (default: MAX_KEPT) of each run of consecutive lines that
# have the same ending.
#
#   * Endings are compared as plain strings with 'eq'.  They are not used as
#     regular expressions, so metacharacters in the data are harmless and an
#     ending that merely contains the previous one starts a new run.
#   * Lines consisting only of a newline are dropped and do not interrupt
#     the current run.
#   * A line that has no non-empty ending in front of a '~' cannot be
#     assigned to a run; it is copied unchanged and ends the current run.
#
# Returns the number of lines written.  Dies if writing to $out fails.
sub limit_repeats {
    my ($in, $out, $max) = @_;
    $max = MAX_KEPT unless defined $max;

    my $run_ending;     # ending shared by the current run; undef between runs
    my $kept    = 0;    # lines of the current run written so far
    my $written = 0;    # total number of lines written

    LINE:
    while (defined(my $line = <$in>)) {
        next LINE if $line eq "\n";

        # List-context match: $ending is undef when the line has no ending,
        # so a stale capture from an earlier line can never leak in.
        my ($ending) = $line =~ /^([^~]+)~/;

        if (defined $ending) {
            if (!defined $run_ending || $ending ne $run_ending) {
                # First line of a new run.
                $run_ending = $ending;
                $kept       = 0;
            }

            # The run has already produced $max lines: discard the surplus.
            next LINE if $kept >= $max;
            $kept++;
        }
        else {
            undef $run_ending;
            $kept = 0;
        }

        print {$out} $line or die "cannot write output: $!";
        $written++;
    }

    return $written;
}

# Filters the files named on the command line (or STDIN) to STDOUT.
sub main {
    limit_repeats(\*ARGV, \*STDOUT);
    return;
}

# Run only when executed as a script, so the file can also be loaded by
# other code (for example a test) without consuming any input.
main() unless caller;