Finishing up NLU module

2024-05-22 23:45:33 +02:00 · 2024-05-22 23:45:33 +02:00 · 6ca7b66fb4
commit 6ca7b66fb4
parent f0c7b481d1
17 changed files with 284 additions and 171 deletions
--- a/.gitignore
+++ b/.gitignore
@ -0,0 +1,4 @@
+__pycache__
+slot-model*
+frame-model*
+nlu_cache
--- a/README.md
+++ b/README.md
@ -35,3 +35,12 @@ Agent powinien wykazywać elastyczność, adaptując się do potrzeb klienta, np
 | offer                       | rekomendacja (restauracji)                              |
 | request                     | pytanie użytkownika o wartość slotu                     |
 | select                      | prośba o dokonanie wyboru spośród przedstawionych opcji |
+
+# Obsługa projektu
+
+- Python 3.10.12
+- Instalacja dependencies `pip3 install -r requirements.txt`
+- Centralna część systemu - uruchamiamy `python3 src/main.py`
+- NLU:
+    - Uczenie modeli od zera `python3 nlu_train.py`
+    - Ewaluacja `python3 evaluate.py`
--- a/evaluate.py
+++ b/evaluate.py
@ -2,11 +2,10 @@ import re
 import os
 import pandas as pd
 import numpy as np
-from nlu_utils import predict_multiple
 from flair.models import SequenceTagger
 from conllu import parse_incr
 from flair.data import Corpus
-from nlu_utils import conllu2flair, nolabel2o
+from src.utils.nlu_utils import conllu2flair, nolabel2o, predict_multiple

 # Frame model evaluation
 frame_model = SequenceTagger.load('frame-model-prod/best-model.pt')
--- a/nlu_train.py
+++ b/nlu_train.py
@ -6,7 +6,7 @@ from flair.embeddings import CharacterEmbeddings
 from flair.embeddings import FlairEmbeddings
 from flair.models import SequenceTagger
 from flair.trainers import ModelTrainer
-from nlu_utils import conllu2flair, nolabel2o
+from src.utils.nlu_utils import conllu2flair, nolabel2o

 import torch
 if torch.cuda.is_available():
--- a/requirements.txt
+++ b/requirements.txt
@ -0,0 +1,5 @@
+flair==0.13.1
+conllu==4.5.3
+pandas==1.5.3
+numpy==1.26.4
+torch==2.3.0
--- a/src/init.py
+++ b/src/init.py
--- a/src/main.py
+++ b/src/main.py
@ -1,26 +1,38 @@
-from model.frame import Frame
 from service.dialog_state_monitor import DialogStateMonitor
 from service.dialog_policy import DialogPolicy
 from service.natural_languag_understanding import NaturalLanguageUnderstanding
 from service.natural_language_generation import NaturalLanguageGeneration

-print("Natural language understanding, example:")
-naturalLanguageUnderstanding = NaturalLanguageUnderstanding()
-print(naturalLanguageUnderstanding.convert_text_to_frame("Cześć, jak masz na imię?"))
+# initialize classes
+nlu = NaturalLanguageUnderstanding() # NLU
+monitor = DialogStateMonitor() # DSM
+dialog_policy = DialogPolicy() # DP
+language_generation = NaturalLanguageGeneration() # NLG

-# Example
-print("Dialog state monitor, examples:")
-monitor = DialogStateMonitor()
-monitor.append(Frame('system', 'hello', []))
-monitor.append(Frame('user', 'some_text', []))
-print(monitor.get_all()[0].act)
-print(monitor.get_last().act)
+# Main loop
+user_input = input("Możesz zacząć pisać.\n")
+while True:
+    # NLU
+    frame = nlu.process_input(user_input)
+    print(frame)

-print("Dialog policy, next dialogue act:")
-dialog_policy = DialogPolicy(monitor.get_all())
-print(dialog_policy.next_dialogue_act().act)
+    # DSM
+    monitor.append(frame)

-print("Natural Language Generation example:")
-agent = NaturalLanguageGeneration()
-response = agent.respond_to_name_query("Jak masz na imię?")
+    # DP
+    print(dialog_policy.next_dialogue_act(monitor.get_all()).act)
+
+    # NLG
+    response = language_generation.respond_to_name_query("Jak masz na imię?")
    print(response)
+
+    if frame.act == "bye":
+        break
+    
+    user_input = input(">\n")
+
+
+
+
+
+
--- a/src/model/init.py
+++ b/src/model/init.py
--- a/src/model/frame.py
+++ b/src/model/frame.py
@ -1,7 +1,14 @@
-from model.slot import Slot
+from .slot import Slot

 class Frame:
    def __init__(self, source: str, act: str, slots: list[Slot]):
        self.source = source
        self.slots = slots
        self.act = act
+
+    def __str__(self):
+        """Return a one-line, human-readable summary of the frame.
+
+        The result has the form ``Act: <act>, Slots: [(<slot>), (<slot>)]``,
+        where each ``<slot>`` is ``str(slot)``. Slots are joined with ", "
+        so no dangling separator is left before the closing bracket.
+        """
+        slots = ", ".join(f"({slot})" for slot in self.slots)
+        return f"Act: {self.act}, Slots: [{slots}]"
--- a/src/model/slot.py
+++ b/src/model/slot.py
@ -2,3 +2,6 @@ class Slot:
    def __init__(self, name, value=None):
        self.name = name
        self.value = value
+
+    def __str__(self) -> str:
+        """Return the slot rendered as ``Name: <name>, Value: <value>``."""
+        name, value = self.name, self.value
+        return f"Name: {name}, Value: {value}"
--- a/src/nlu_example.py
+++ b/src/nlu_example.py
@ -1,8 +1,8 @@
 from flair.models import SequenceTagger
-from nlu_utils import predict_single, predict_multiple, predict_and_annotate
+from utils.nlu_utils import predict_single, predict_multiple, predict_and_annotate

 # Exploratory tests
-frame_model = SequenceTagger.load('frame-model/best-model.pt')
+frame_model = SequenceTagger.load('frame-model-prod/best-model.pt')
 tests = [
    'chciałbym zamówić pizzę',
    'na godzinę 12',
@ -16,7 +16,7 @@ tests = [
    'pizzę barcelona bez cebuli',
 ]

-# print("=== Exploratory tests - frame model ===")
+print("=== Exploratory tests - frame model ===")
 for test in tests:
    print(f"Sentence: {test}")
    print(f"Single prediction: {predict_single(frame_model, test.split(), 'frame')}")
@ -24,7 +24,7 @@ for test in tests:
    print(f"Annotated sentence: {predict_and_annotate(frame_model, test.split(), 'frame')}")

 print("=== Exploratory tests - slot model ===")
-slot_model = SequenceTagger.load('slot-model/final-model.pt')
+slot_model = SequenceTagger.load('slot-model-prod/best-model.pt')
 for test in tests:
    print(f"Sentence: {test}")
    print(f"Prediction: {predict_and_annotate(slot_model, test.split(), 'slot')}")
--- a/src/service/init.py
+++ b/src/service/init.py
--- a/src/service/dialog_policy.py
+++ b/src/service/dialog_policy.py
@ -1,11 +1,8 @@
 from model.frame import Frame

 class DialogPolicy:
-    def __init__(self, frames: list[Frame]) -> None:
-        self.frames = frames
-
-    def next_dialogue_act(self) -> Frame:
-        if self.frames[-1].act == "welcomemsg":
+    def next_dialogue_act(self, frames: list[Frame]) -> Frame:
+        if frames[-1].act == "welcomemsg":
            return Frame("system", "welcomemsg", [])
        else:
            return Frame("system", "canthelp", [])
--- a/src/service/natural_languag_understanding.py
+++ b/src/service/natural_languag_understanding.py
@ -1,14 +1,92 @@
+from flair.models import SequenceTagger
+from utils.nlu_utils import predict_single, predict_and_annotate
+from model.frame import Frame, Slot
+
+"""
+ACTS:
+    inform/order
+    request/menu
+    inform/address
+    request/price
+    request/ingredients
+    request/sauce
+    inform/phone
+    inform/order-complete
+    request/time
+    request/size
+    welcomemsg
+    affirm
+    inform/delivery
+    inform/payment
+    request/delivery-price
+    bye
+    inform/time
+    request/drinks
+    inform/name
+    negate
+
+SLOTS:
+    food
+    pizza
+    size
+    address
+    quantity
+    ingredient
+    payment-method
+    delivery
+    drink
+    ingredient/neg
+    name
+    phone
+    sauce
+"""
+
 class NaturalLanguageUnderstanding:
+    def __init__(self):
+        print("\n========================================================")
+        print("Models are loading, it may take a moment, please wait...")
+        print("========================================================\n")

-    dictionary = {
-        "Cześć," : "welcomemsg()",
-        "imię?" : "request(name)"
-    }
+        self.frame_model = SequenceTagger.load('frame-model-prod/best-model.pt')
+        self.slot_model = SequenceTagger.load('slot-model-prod/best-model.pt')

-    def convert_text_to_frame(self, text: str):
-        frame = ""
-        text = text.split(" ")
-        for word in text:
-            if(word in self.dictionary):
-                    frame+=self.dictionary[word]+"&"
-        return frame[0:-1]
+        print("\n========================================================")
+        print("Models loaded. NLU system is ready.")
+        print("========================================================\n")
+    
+    def __predict_intention(self, text: str):
+        """Predict the dialogue act of ``text`` with the frame model.
+
+        The text is split on whitespace and handed to ``predict_single``
+        together with the ``'frame'`` label type; whatever that helper
+        returns is passed through unchanged.
+        """
+        tokens = text.split()
+        return predict_single(self.frame_model, tokens, 'frame')
+
+    def __predict_slot(self, text: str):
+        """Extract slots from ``text`` using the slot model's BIO tags.
+
+        The text is split on whitespace and passed to
+        ``predict_and_annotate``; each returned annotation is read through
+        its ``"form"`` (token) and ``"slot"`` (tag) keys. Consecutive tokens
+        tagged ``B-<name>`` / ``I-<name>`` are joined with single spaces
+        into one ``Slot(name, value)``.
+
+        An ``I-`` tag that does not continue the currently open slot (no
+        slot is open, or the name differs) starts a new slot instead of
+        being dropped or glued onto an unrelated slot. Tags that are
+        neither ``B-``/``I-`` prefixed nor ``"O"`` leave the state untouched.
+
+        Returns:
+            A list of ``Slot`` objects in the order they occur in ``text``.
+        """
+        annotations = predict_and_annotate(self.slot_model, text.split(), 'slot')
+        slots = []
+        current_slot = None
+        words = []
+
+        for annotation in annotations:
+            form = annotation["form"]
+            tag = annotation["slot"]
+            prefix, name = tag[:2], tag[2:]
+
+            if prefix == "I-" and name == current_slot:
+                # Continuation of the slot that is currently open.
+                words.append(form)
+            elif prefix in ("B-", "I-") or tag == "O":
+                # Any boundary closes the open slot first.
+                if current_slot is not None:
+                    slots.append(Slot(name=current_slot, value=" ".join(words)))
+                if tag == "O":
+                    current_slot, words = None, []
+                else:
+                    # "B-" always opens a slot; a stray "I-" does so too.
+                    current_slot, words = name, [form]
+
+        # Flush a slot that runs up to the end of the sentence.
+        if current_slot is not None:
+            slots.append(Slot(name=current_slot, value=" ".join(words)))
+
+        return slots
+
+    def process_input(self, text: str):
+        """Convert raw user text into a ``Frame`` with source ``'user'``.
+
+        The dialogue act is predicted first, then the slots; both results
+        are stored on the returned frame.
+        """
+        return Frame(
+            source='user',
+            act=self.__predict_intention(text),
+            slots=self.__predict_slot(text),
+        )
--- a/src/service/natural_language_generation.py
+++ b/src/service/natural_language_generation.py
@ -1,5 +1,5 @@
 class NaturalLanguageGeneration:
-    def __init__(self, name):
+    def __init__(self):
        self.name = ["Michał"]

    def respond_to_name_query(self, question):
--- a/src/utils/init.py
+++ b/src/utils/init.py
--- a/src/utils/nlu_utils.py
+++ b/src/utils/nlu_utils.py
@ -69,7 +69,6 @@ def predict_single(model, sentence, label_type):
    csentence = __csentence(sentence, label_type)
    fsentence = __predict(model, csentence)
    intent = {}
-
    for span in fsentence.get_spans(label_type):
        tag = span.get_label(label_type).value
        if tag in intent: