BLUR-15 Zmiana detekcji twarzy na detekcję obiektów. Dodanie klasy dla ramek wokół obiektów. Dodanie wizualizacji.

2023-11-24 21:44:34 +01:00 · 2023-11-24 21:44:34 +01:00 · 7fa6bb231c
commit 7fa6bb231c
parent 87989245b9
3 changed files with 69 additions and 29 deletions
--- a/ml/assets/fonts/arial.ttf
+++ b/ml/assets/fonts/arial.ttf
--- a/ml/element_detection.py
+++ b/ml/element_detection.py
@ -0,0 +1,69 @@
 import os
 from typing import List, Tuple
 import torch
 from PIL import Image, ImageDraw, ImageFont
 from ultralytics import YOLO
 DIR_PATH = os.path.dirname(os.path.realpath(__file__))
 FACES_PATH = os.path.join(DIR_PATH, "assets/weights/yolov8n-face.pt")
 PLATES_PATH = os.path.join(DIR_PATH, "assets/weights/yolov8-plate.pt")
 FACES_MODEL = YOLO(FACES_PATH)
 PLATES_MODEL = YOLO(PLATES_PATH)
 CONF_THRESH = 0.3
 IOU_THRESH = 0.5
 class BoundBox:
    def __init__(self, x1, y1, x2, y2):
        self.x1, self.y1, self.x2, self.y2 = x1, y1, x2, y2
        self.selected = True
    def select(self):
        self.selected = True
    def unselect(self):
        self.selected = False
    def get_params(self) -> Tuple[int, int, int, int]:
        return self.x1, self.y1, self.x2, self.y2
 def detect(image_path: str) -> List[BoundBox]:
    device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
    faces = FACES_MODEL.predict(
        source=image_path, conf=CONF_THRESH, iou=IOU_THRESH, device=device
    )
    faces = faces[0].cpu().numpy().boxes
    plates = PLATES_MODEL.predict(
        source=image_path, conf=CONF_THRESH, iou=IOU_THRESH, device=device
    )
    plates = plates[0].cpu().numpy().boxes
    bounding_boxes = []
    for boxes in [faces, plates]:
        for box in boxes:
            xyxyn = box.xyxy[0]
            x1 = int(xyxyn[0])
            y1 = int(xyxyn[1])
            x2 = int(xyxyn[2])
            y2 = int(xyxyn[3])
            bounding_boxes.append(BoundBox(x1, y1, x2, y2))
    return bounding_boxes
 def show_image_with_boxes(
    in_image_path: str, bounding_boxes: List[BoundBox], out_image_path: str = None
 ):
    img = Image.open(in_image_path)
    draw = ImageDraw.Draw(img)
    font_path = DIR_PATH + "/assets/fonts/arial.ttf"
    font = ImageFont.truetype(font_path, 25)
    for i, box in enumerate(bounding_boxes):
        draw.rectangle(box.get_params(), outline="red", width=2, fill=None)
        draw.text((box.x1 + 5, box.y1 + 5), str(i+1), fill="red", font=font)
    if not out_image_path:
        out_image_path = (
            in_image_path.split(".")[0] + "_out." + in_image_path.split(".")[1]
        )
    img.save(out_image_path)
--- a/ml/face_detection.py
+++ b/ml/face_detection.py
@ -1,29 +0,0 @@
 import os
 from typing import List
 import torch
 from ultralytics import YOLO
 WEIGHTS_PATH = "assets/weights/yolov8n-face.pt"
 DIR_PATH = os.path.dirname(os.path.realpath(__file__))
 WEIGHTS_PATH = os.path.join(DIR_PATH, WEIGHTS_PATH)
 MODEL = YOLO(WEIGHTS_PATH)
 CONF_THRESH = 0.01
 IOU_THRESH = 0.5
 # TODO: currently detect_faces accepts a image path, but it can be changed to accept images in memory
 def detect_faces(image_path: str) -> List[tuple[int, int, int, int]]:
    device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
    results = MODEL.predict(source=image_path, conf=CONF_THRESH, iou=IOU_THRESH, device=device)
    face_boxes = []
    result = results[0].cpu().numpy()
    for box in result.boxes:
        xyxyn = box.xyxy[0]
        x1 = int(xyxyn[0])
        y1 = int(xyxyn[1])
        x2 = int(xyxyn[2])
        y2 = int(xyxyn[3])
        face_boxes.append((x1, y1, x2, y2))
    return face_boxes