gitignore update + run.py reformat

This commit is contained in:
MatOgr 2023-06-14 22:50:53 +02:00
parent 1ff6ba7d37
commit 8b58507f52
2 changed files with 18 additions and 21 deletions

3
.gitignore vendored
View File

@@ -6,3 +6,6 @@
*.o *.o
.DS_Store .DS_Store
.token .token
scripts/*
solution/*
models/*

36
run.py
View File

@@ -1,24 +1,18 @@
#!/usr/bin/python3 #!/usr/bin/python3
import sys from scripts.language_utils import predict_gaps, train_model, load_lexicon
for line in sys.stdin: WORDS_LIMIT = 10
_, _, _, _, _, _, left_context, right_context = line.split("\t")
if __name__ == "__main__":
previous_word = left_context.split()[-1] lexicon = load_lexicon("./words_alpha.txt")
next_word = right_context.split()[0] model = train_model("./train/in.tsv.xz", "./train/expected.tsv", lexicon)
for i, (directory, lines_no) in enumerate(zip(["dev-0", "test-A"], (10519, 7414))):
if previous_word == "United" and next_word == "of": predict_gaps(
print("States:0.9 :0.1") model,
elif previous_word == "used": f"./{directory}/in.tsv.xz",
print("to:0.4 it:0.3 as:0.2 :0.1") f"./{directory}/out.tsv",
elif previous_word.lower() == "in": lexicon,
print("the:0.7 a:0.1 an:0.1 :0.1") lines_no,
elif previous_word.lower() == "i": WORDS_LIMIT,
print("am:0.3 was:0.3 have:0.3 :0.1") )
elif previous_word.lower() in ["he", "she", "it"]:
print("is:0.3 was:0.3 has:0.3 :0.1")
elif previous_word.lower() in "bring":
print("something:0.3 it:0.3 them:0.3 :0.1")
else:
print("the:0.5 a:0.2 an:0.2 :0.1")