challenging-america-word-ga.../run.py

19 lines
552 B
Python
Raw Normal View History

2023-03-29 11:07:35 +02:00
#!/usr/bin/python3
2023-06-14 22:50:53 +02:00
from scripts.language_utils import predict_gaps, train_model, load_lexicon
2023-03-29 11:14:30 +02:00
2023-06-14 22:50:53 +02:00
# Forwarded unchanged as the last argument of every predict_gaps call.
# NOTE(review): presumably caps how many candidate words are emitted per gap;
# confirm against scripts.language_utils.predict_gaps.
WORDS_LIMIT = 10


def main() -> None:
    """Train the model once, then run gap prediction for each evaluation split.

    Loads the lexicon from ``./words_alpha.txt``, trains a model from
    ``./train/in.tsv.xz`` and ``./train/expected.tsv``, and calls
    ``predict_gaps`` for the ``dev-0`` and ``test-A`` directories, passing
    ``./<dir>/in.tsv.xz`` and ``./<dir>/out.tsv`` as the two path arguments.
    All paths are relative to the current working directory.
    """
    lexicon = load_lexicon("./words_alpha.txt")
    model = train_model("./train/in.tsv.xz", "./train/expected.tsv", lexicon)

    # Each split is paired explicitly with the number handed to predict_gaps
    # as ``lines_no``, so the two values cannot drift out of alignment.
    # NOTE(review): the numbers look like the line counts of the respective
    # in.tsv.xz files; verify before changing the data.
    splits = (
        ("dev-0", 10519),
        ("test-A", 7414),
    )
    for directory, lines_no in splits:
        predict_gaps(
            model,
            f"./{directory}/in.tsv.xz",
            f"./{directory}/out.tsv",
            lexicon,
            lines_no,
            WORDS_LIMIT,
        )


if __name__ == "__main__":
    main()