gph i dgc obsluguja configi

git-svn-id: svn://atos.wmid.amu.edu.pl/utt@33 e293616e-ec6a-49c2-aa92-f4a8b91c5d16
This commit is contained in:
pawelk 2008-04-24 10:36:13 +00:00
parent a5fdde9613
commit 19dfa5cb76
3 changed files with 426 additions and 289 deletions

View File

@ -13,14 +13,14 @@ my $usr_home = catdir(home(), '.utt');
prepareUttUsrHome($usr_home);
conf_utt(catfile($usr_home, 'utt.conf'), $sys_home);
conf_compiledic(catfile($usr_home, 'compiledic.conf'), $sys_home);
conf_cor(catfile($usr_home, 'cor.conf'), $sys_home);
conf_dgc(catfile($usr_home, 'dgc.conf'), $sys_home);
conf_kor(catfile($usr_home, 'kor.conf'), $sys_home);
conf_compiledic(catfile($usr_home, 'compiledic.conf'), $sys_home);
conf_grp(catfile($usr_home, 'grp.conf'), $sys_home);
conf_gue(catfile($usr_home, 'gue.conf'), $sys_home);
conf_kor(catfile($usr_home, 'kor.conf'), $sys_home);
conf_lem(catfile($usr_home, 'lem.conf'), $sys_home);
conf_ser(catfile($usr_home, 'ser.conf'), $sys_home);
conf_dgc(catfile($usr_home, 'dgc.conf'), $sys_home);
print "UTT user configuration created in $usr_home\n";
@ -107,7 +107,7 @@ sub conf_kor() {
print FILE makeConfigHeader();
print FILE "dictionary-home=", abs_path("$utthome/share/utt"), "\n";
print FILE "weights=", abs_path("$utthome/lib/utt/weights.kor"), "\n";
print FILE "weights=", abs_path("$utthome/lib/utt/weights.cor"), "\n";
print FILE "threshold=1.0\n";
close FILE;
@ -221,8 +221,8 @@ sub conf_dgc() {
open(FILE, ">$dgc_file");
print FILE makeConfigHeader();
print FILE "categories=", abs_path("$utthome/lib/utt/cats.dgc"), "\n";
print FILE "grammar=", abs_path("$utthome/lib/utt/gram.dgc"), "\n";
print FILE "catfile=", abs_path("$utthome/lib/utt/cats.dgc"), "\n";
print FILE "gramfile=", abs_path("$utthome/lib/utt/gram.dgc"), "\n";
close FILE;

View File

@ -5,18 +5,83 @@
#version: 1.0
#author: Tomasz Obrebski
# wymaga niejawnie programu canonize!!!!
#use lib "ENV{HOME}/.utt/lib/perl";
#use strict;
use strict;
use Getopt::Long;
use Data::Dumper;
use attr;
#use File::HomeDir;
use File::HomeDir;
my $systemconfigfile='/usr/local/etc/utt/dgc.conf';
my $userconfigfile=home()."/.utt/dgc.conf";
Getopt::Long::Configure('no_ignore_case_always');
my $help=0;
my $catfile=0;
my $dicfile=0;
my $gramfile=0;
my $outputfile=0;
#read configuration files###########################
my $file;
foreach $file ($systemconfigfile, $userconfigfile){
if(open(CONFIG, $file)){
while (<CONFIG>) {
chomp;
s/#.*//;
s/^\s+//;
s/\s+$//;
next unless length;
my ($name, $value) = split(/\s*=\s*/, $_, 2);
if(($name eq "catfile")or($name eq "c")){
$catfile=$value;
}
elsif(($name eq "dicfile")or($name eq "d")){
$dicfile=$value;
}
elsif(($name eq "gramfile")or($name eq "g")){
$gramfile=$value;
}
elsif(($name eq "outputfile")or($name eq "o")){
$outputfile=$value;
}
elsif(($name eq "help")or($name eq "h")){
$help=1;
}
}
close CONFIG;
}
}
#########################################################
GetOptions("help|h" => \$help,
"catfile|c=s" => \$catfile,
"dicfile|d=s" => \$dicfile,
"gramfile|g=s" => \$gramfile,
"outputfile|o=s" => \$outputfile);
if($help)
{
print <<'END'
Usage: dgc [OPTIONS]
Options:
--catfile -c filename List of syntactic categories.
--dicfile -d filename Dictionary.
--gramfile -g filename List of grammar rules.
--outputfile -o filename Output filename.
--help -h Help.
END
;
exit 0;
}
die("At least one of --cats and --dic must be given.\n") if !$catfile && !$dicfile;
my $ncat=0;
my $nrole=0;
@ -26,42 +91,44 @@ my $nright=0;
my $nreq=0;
my $nlink=0;
GetOptions("help|h" => \$help,
"catfile|c=s" => \$catfile,
"dicfile|d=s" => \$dicfile,
"gramfile|g=s" => \$gramfile);
if($help)
{
print <<'END'
Usage: dgpcompile [OPTIONS]
Options:
--cats -c filename List of syntactic categories.
--dic -d filename Dictionary.
--help -h Help.
END
;
exit 0;
}
die("At least one of --cats and --dic must be given.\n") if !$catfile && !$dicfile;
my %cats;
my %roles;
my %agr;
my %gov;
if(!$outputfile) {
*OUTPUT = *STDOUT;
}
elsif($outputfile eq "-") {
*OUTPUT = *STDOUT;
}
else {
open(OUTPUT, ">$outputfile") or die("Can't open output file: $outputfile!");
}
loadcats($catfile) if $catfile;
extractcats($dicfile) if $dicfile;
$cats_re = qr/(?:$attr::cat_re\s*(?:,\s*$attr::cat_re)*)/;
my $cats_re = qr/(?:$attr::cat_re\s*(?:,\s*$attr::cat_re)*)/;
# class parse_class:
# /$attr::cat_re/g;
while(<>)
if(!$gramfile) {
*INPUT = *STDIN;
}
elsif($gramfile eq "-"){
*INPUT = *STDIN;
}
else {
open(INPUT, $gramfile) or die("Unable to open: $gramfile!");
}
while(<INPUT>)
{
if(/^\s*AGR\s+(\S+)\s+(\S+)\s*$/)
{
@ -74,22 +141,22 @@ while(<>)
elsif(/^\s*ROLE\s+\S+\s*$/)
{
$roles{$_}=1;
print;
print OUTPUT;
}
elsif(/^\s*SGL\s+\S+\s*$/)
{
++$nsgl;
print;
print OUTPUT;
}
elsif(/^\s*REQ\s+(\S+)\s+(\S+)\s*$/)
{
print "#$_";
print OUTPUT "#$_";
my $cat = attr::parse $1;
for my $atomcat (keys %cats)
{
if(attr::match @$cat, @{$cats{$atomcat}})
{
print "REQ ".$atomcat." $2\n";
print OUTPUT "REQ ".$atomcat." $2\n";
++$nreq;
}
}
@ -97,19 +164,19 @@ while(<>)
elsif(/^\s*LEFT\s+\S+\s*$/)
{
++$nleft;
print;
print OUTPUT;
}
elsif(/^\s*RIGHT\s+\S+\s*$/)
{
++$nright;
print;
print OUTPUT;
}
elsif(($hs,$ds,$r) = /^\s*LINK\s+($cats_re)\s+($cats_re)\s+(\S+)\s*$/)
elsif(my ($hs,$ds,$r) = /^\s*LINK\s+($cats_re)\s+($cats_re)\s+(\S+)\s*$/)
{
print "#$_";
for $h ($hs =~ /$attr::cat_re/g)
print OUTPUT "#$_";
for my $h ($hs =~ /$attr::cat_re/g)
{
for $d ($ds =~ /$attr::cat_re/g)
for my $d ($ds =~ /$attr::cat_re/g)
{
addlinks($h,$d,$r);
}
@ -118,17 +185,17 @@ while(<>)
else
{
print;
print OUTPUT;
}
}
sub addlinks
{
($h,$d,$r) = @_;
my ($h,$d,$r) = @_;
for my $a (@{$agr{$r}}) { print "#AGR $r $a\n"; }
for my $c (@{$gov{$r}}) { print "#GOV $r ".attr::unparse(@$c)."\n"; }
for my $a (@{$agr{$r}}) { print OUTPUT "#AGR $r $a\n"; }
for my $c (@{$gov{$r}}) { print OUTPUT "#GOV $r ".attr::unparse(@$c)."\n"; }
my $head = attr::parse $h;
my $dep = attr::parse $d;
@ -151,9 +218,9 @@ sub addlinks
next DEP if ! attr::match(@$c,@{$cats{$atomdep}});
}
print "LINK ";
print $atomhead." ";
print $atomdep." $r\n";
print OUTPUT "LINK ";
print OUTPUT $atomhead." ";
print OUTPUT $atomdep." $r\n";
++$nlink;
}
@ -179,10 +246,10 @@ sub extractcats
{
while(/,([^[:space:];]+)/g)
{
$cat=$1;
my $cat=$1;
next if !$cat || exists $cats{$cat};
$ncat++;
print "CAT $1\n";
print OUTPUT "CAT $1\n";
$cats{$cat}=attr::parse($cat);
}
}
@ -198,9 +265,10 @@ sub loadcats
{
tr/ \t\n//d;
next if !$_ || exists $cats{$_};
print "CAT $_\n";
print OUTPUT "CAT $_\n";
++$ncat;
$cats{$_}=attr::parse($_);
}
close CATFILE;
}

View File

@ -7,17 +7,72 @@
use strict;
use Getopt::Long;
use File::HomeDir;
my $systemconfigfile='/usr/local/etc/utt/gph.conf';
my $userconfigfile=home()."/.utt/gph.conf";
Getopt::Long::Configure('no_ignore_case_always');
my @process;
my $help=0;
my $inputfile=0;
my $outputfile=0;
my @process=();
my $reset;
my $interactive=1;
my $interactive=0;
#read configuration files###########################
my $file;
my @process_conf=();
foreach $file ($systemconfigfile, $userconfigfile){
if(open(CONFIG, $file)){
while (<CONFIG>) {
chomp;
s/#.*//;
s/^\s+//;
s/\s+$//;
next unless length;
my ($name, $value) = split(/\s*=\s*/, $_, 2);
if(($name eq "inputfile")or($name eq "f")){
$inputfile=$value;
}
elsif(($name eq "outputfile")or($name eq "o")){
$outputfile=$value;
}
elsif(($name eq "process")or($name eq "p")){
push @process_conf, $value;
}
elsif(($name eq "reset")or($name eq "r")){
$reset=$value;
}
elsif(($name eq "interactive")or($name eq "i")){
$interactive=1;
}
elsif(($name eq "help")or($name eq "h")){
$help=1;
}
}
close CONFIG;
}
}
#########################################################
GetOptions("process|p=s" => \@process,
"inputfile|f=s" => \$inputfile,
"outputfile|o=s" => \$outputfile,
"help|h" => \$help,
"reset|r=s" => \$reset,
"interactive|i" => \$interactive);
@process = @process_conf if @process<1;
if($help)
{
print <<'END'
@ -26,9 +81,9 @@ Usage: gph [OPTIONS]
Options:
-p tag Process segments with this tag as nodes.
-r tag Start new graph at this tag.
-f filename Input file (NIE DZIALA).
-o filename Output file (NIE DZIALA).
-i Toggle interactive mode (default=on).
-f filename Input file.
-o filename Output file.
-i Toggle interactive mode (default=off).
END
;
exit 0;
@ -37,11 +92,25 @@ END
$|=1 if $interactive;
my @prev;
if(!$inputfile or $inputfile eq "-") {
*INPUT = *STDIN;
}
else {
open(INPUT, "$inputfile") or die("Can't open input file: $inputfile!");
}
if(!$outputfile or $outputfile eq "-") {
*OUTPUT = *STDOUT;
}
else {
open(OUTPUT, "$outputfile") or die("Can't open output file: $outputfile!");
}
my @prev;
my $n=0;
while(<>)
while(<INPUT>)
{
chomp;
my $do=0;
@ -88,6 +157,6 @@ while(<>)
}
print $_.$gph."\n";
print OUTPUT $_.$gph."\n";
}