diff --git a/.gitignore b/.gitignore new file mode 100644 index 0000000..2b079b0 --- /dev/null +++ b/.gitignore @@ -0,0 +1,4 @@ +*.tsv +*.txt +*.trn +results diff --git a/count_lines.sh b/count_lines.sh old mode 100644 new mode 100755 index 3c3a81f..9b73c27 --- a/count_lines.sh +++ b/count_lines.sh @@ -3,28 +3,34 @@ #zad 1 wc -l wikiniews_results.tsv > counted_lines_result.txt -#zad 3 -cut --fields=2 wikiniews_results.tsv > hypothesis.txt -cut --fields=3 wikiniews_results.tsv > reference.txt - -awk 'BEGIN{FS=OFS="\t"}{print $0,"(sp1_"NR")"}' < hypothesis.txt > hypothesis.trn -awk 'BEGIN{FS=OFS="\t"}{print $0,"(sp1_"NR")"}' < reference.txt > reference.trn - -sclite -f 0 -r reference.trn trn -h hypothesis.trn trn -e utf-8 -i rm -o all stdout | grep Score > results - -# #C #S #D #I do obliczen WER -awk 'BEGIN{OFS="\t"}{print $6, $7, $8, $9}' < results | awk '{ print ($2 + $3 + $4)/($2 + $3 + $1) }' > wer.tsv - -paste wikiniews_results.tsv wer.tsv > wikiniews_results.tsv - -awk 'BEGIN{FS=OFS="\t"}{ bad = bad + $1; all++ }END{ print bad/all }' < wer.tsv >> wer.txt -awk 'BEGIN{FS=OFS="\t"}{ if ( $1 == 0 ) good++; all++ }END{ print good/all }' < wer.tsv >> srr.txt - -tail -n 50 wer.txt > wer1.txt -tail -n 50 srr.txt > srr1.txt - -rm wer.txt -rm srr.txt - -mv wer1.txt wer.txt -mv srr1.txt srr.txt +##zad 3 +## dzielenie linii +#cut --fields=2 wikiniews_results.tsv > hypothesis.txt +#cut --fields=3 wikiniews_results.tsv > reference.txt +# +## tworzenie plikow trn +#awk 'BEGIN{FS=OFS="\t"}{print $0,"(sp1_"NR")"}' < hypothesis.txt > hypothesis.trn +#awk 'BEGIN{FS=OFS="\t"}{print $0,"(sp1_"NR")"}' < reference.txt > reference.trn +# +#sclite -f 0 -r reference.trn trn -h hypothesis.trn trn -e utf-8 -i rm -o all stdout | grep Score > results +# +## #correct words #substitutions #deletions #insertions do obliczen WER +#awk 'BEGIN{OFS="\t"}{print $6, $7, $8, $9}' < results | awk '{ print ($2 + $3 + $4)/($2 + $3 + $1) }' > wer.tsv +# +#paste wikiniews_results.tsv wer.tsv > wikiniews_results.tsv +# +## procent niepoprawnie rozpoznanych wyrazów +#awk 'BEGIN{FS=OFS="\t"}{ bad = bad + $1; all++ }END{ print bad/all }' < wer.tsv >> wer.txt +# +## procent całkowicie poprawnie rozpoznanych zdań +#awk 'BEGIN{FS=OFS="\t"}{ if ( $1 == 0 ) good++; all++ }END{ print good/all }' < wer.tsv >> srr.txt +# +## zamiana treści +#tail -n 50 wer.txt > wer1.txt +#tail -n 50 srr.txt > srr1.txt +# +#rm wer.txt +#rm srr.txt +# +#mv wer1.txt wer.txt +#mv srr1.txt srr.txt diff --git a/wikiniews_results.tsv b/wikiniews_results.tsv index d48080b..e69de29 100644 --- a/wikiniews_results.tsv +++ b/wikiniews_results.tsv @@ -1,200 +0,0 @@ - 0 - 0 - 0 - 0.133333 - 0 - 0.363636 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0.0588235 - 0 - 0 - 0.375 - 0 - 0 - 0 - 0.105263 - 0 - 0.24 - 0 - 0 - 0.2 - 0.333333 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0.142857 - 0.173913 - 0 - 0 - 0 - 0 - 0 - 0.0645161 - 0.470588 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0.84 - 0 - 0.0625 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0.0454545 - 0 - 0 - 0 - 0 - 0.117647 - 0 - 0.137931 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0.703704 - 0 - 0.0357143 - 0 - 0 - 0.0714286 - 0 - 0.15 - 0.136364 - 0 - 0 - 0.0588235 - 0 - 0 - 0.333333 - 0 - 0 - 0 - 0.15 - 0 - 0 - 0.153846 - 0.0714286 - 0 - 0 - 0 - 0 - 0.0909091 - 0 - 0 - 0 - 0 - 0 - 0 - 0.0666667 - 0 - 0.645161 - 0 - 0 - 0.0625 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0.5 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0.133333 - 0.105263 - 0.692308 - 0 - 0 - 0 - 0 - 0 - 0 - 0.0625 - 0 - 0 - 0.25 - 0.214286 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0.03125 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0.047619 - 0.8 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0 - 0.0588235 - 0 - 0 - 0.2