changed neural network to CNN and added some tests

added functions for loading images, model and testing
added useful functions for tile selection and more
2024-05-26 23:28:22 +02:00 · 2024-05-26 19:56:18 +02:00 · 2024-05-26 19:54:46 +02:00
18 changed files with 84 additions and 32 deletions
--- a/source/NN/pycache/model.cpython-311.pyc
+++ b/source/NN/pycache/model.cpython-311.pyc
--- a/source/NN/pycache/neural_network.cpython-311.pyc
+++ b/source/NN/pycache/neural_network.cpython-311.pyc
--- a/source/NN/model.py
+++ b/source/NN/model.py
@ -3,16 +3,26 @@ import torch
 import torch.nn.functional as F


-class Neural_Network_Model(nn.Module):
-    def __init__(self, num_classes=5,hidden_layer1 = 100,hidden_layer2 = 100):
-        super(Neural_Network_Model, self).__init__()
-        self.fc1 = nn.Linear(150*150*3,hidden_layer1)
+class Conv_Neural_Network_Model(nn.Module):
+    def __init__(self, num_classes=5,hidden_layer1 = 512,hidden_layer2 = 256):
+        super(Conv_Neural_Network_Model, self).__init__()
+        
+        self.conv1 = nn.Conv2d(in_channels=3, out_channels=32, kernel_size=3, stride=1, padding=1)
+        self.pool1 = nn.MaxPool2d(kernel_size=2, stride=2, padding=0)
+        self.conv2 = nn.Conv2d(in_channels=32, out_channels=64, kernel_size=3, stride=1, padding=1)
+        self.pool2 = nn.MaxPool2d(kernel_size=2, stride=2, padding=0)
+        self.conv3 = nn.Conv2d(in_channels=64, out_channels=128, kernel_size=3, stride=1, padding=1)
+        self.pool3 = nn.MaxPool2d(kernel_size=2, stride=2, padding=0)
+
+        self.fc1 = nn.Linear(128*12*12,hidden_layer1)
        self.fc2 = nn.Linear(hidden_layer1,hidden_layer2)
        self.out = nn.Linear(hidden_layer2,num_classes)
-# two hidden layers

    def forward(self, x):
-        x = x.view(-1, 150*150*3)
+        x = self.pool1(F.relu(self.conv1(x)))
+        x = self.pool2(F.relu(self.conv2(x)))
+        x = self.pool3(F.relu(self.conv3(x)))
+        x = x.view(-1, 128*12*12) #<----flattening the image
        x = self.fc1(x)
        x = torch.relu(x)
        x = self.fc2(x)
--- a/source/NN/neural_network.py
+++ b/source/NN/neural_network.py
@ -4,7 +4,6 @@ from torch.utils.data import DataLoader
 from torchvision import datasets, transforms, utils
 from torchvision.transforms import Compose, Lambda, ToTensor
 import matplotlib.pyplot as plt
-import numpy as np
 from model import *
 from PIL import Image

@ -12,9 +11,9 @@ device = torch.device('cuda')

 #data transform to tensors:
 data_transformer = transforms.Compose([
-    transforms.Resize((150, 150)),  
+    transforms.Resize((100, 100)), 
    transforms.ToTensor(),  
-    transforms.Normalize((0.5, 0.5, 0.5), (0.5, 0.5, 0.5))  
+    transforms.Normalize((0.5, 0.5, 0.5 ), (0.5, 0.5, 0.5))  
    ])


@ -24,18 +23,13 @@ test_set = datasets.ImageFolder(root='resources/test', transform=data_transforme


 #to mozna nawet przerzucic do funkcji train:
-#train_loader = DataLoader(train_set, batch_size=32, shuffle=True, num_workers=2)
-#test_loader = DataLoader(test_set, batch_size=32, shuffle=True, num_workers=2)
-
-#test if classes work properly:
-#print(train_set.classes)
-#print(train_set.class_to_idx)
-#print(train_set.targets[3002])
+# train_loader = DataLoader(train_set, batch_size=64, shuffle=True)
+#test_loader = DataLoader(test_set, batch_size=32, shuffle=True)


 #function for training model
 def train(model, dataset, iter=100, batch_size=64):
-    optimizer = torch.optim.SGD(model.parameters(), lr=0.01)
+    optimizer = torch.optim.SGD(model.parameters(), lr=0.001)
    criterion = nn.NLLLoss()
    train_loader = DataLoader(dataset, batch_size=batch_size, shuffle=True)
    model.train()
@ -62,14 +56,12 @@ def accuracy(model, dataset):
    return correct.float() / len(dataset)


-
-
-
-model = Neural_Network_Model()
+model = Conv_Neural_Network_Model()
 model.to(device)

-model.load_state_dict(torch.load('model.pth'))
-model.eval()
+#loading the already saved model:
+# model.load_state_dict(torch.load('model.pth'))
+# model.eval()

 #training the model:
 # train(model, train_set)
@ -77,14 +69,42 @@ model.eval()
 # torch.save(model.state_dict(), 'model.pth')


+
+def load_model():
+    model = Conv_Neural_Network_Model()
+    model.load_state_dict(torch.load('CNN_model.pth'))
+    model.eval()
+    return model
+
+
+def load_image(image_path):
+    testImage = Image.open(image_path)
+    testImage = data_transformer(testImage)
+    testImage = testImage.unsqueeze(0)
+    return testImage
+
+def guess_image(model, image_tensor):
+    with torch.no_grad():
+        testOutput = model(image_tensor)
+        _, predicted = torch.max(testOutput, 1)
+        predicted_class = train_set.classes[predicted.item()]
+    return predicted_class
+
+
+
+# image_path = 'resources/images/plant_photos/pexels-dxt-73640.jpg'
+# image_tensor = load_image(image_path)
+# prediction = guess_image(load_model(), image_tensor)
+# print(f"The predicted image is: {prediction}")
+
 #TEST - loading the image and getting results:
-testImage_path = 'resources/images/plant_photos/pexels-polina-tankilevitch-4110456.jpg'
+testImage_path = 'resources/images/plant_photos/pexels-justus-menke-3490295-5213970.jpg'
 testImage = Image.open(testImage_path)
 testImage = data_transformer(testImage)
 testImage = testImage.unsqueeze(0)
 testImage = testImage.to(device)

-model.load_state_dict(torch.load('model.pth'))
+model.load_state_dict(torch.load('CNN_model.pth'))
 model.to(device)
 model.eval()

@ -92,4 +112,3 @@ testOutput = model(testImage)
 _, predicted = torch.max(testOutput, 1)
 predicted_class = train_set.classes[predicted.item()]
 print(f'The predicted class is: {predicted_class}')
-
--- a/source/pycache/astar.cpython-311.pyc
+++ b/source/pycache/astar.cpython-311.pyc
--- a/source/pycache/bfs.cpython-311.pyc
+++ b/source/pycache/bfs.cpython-311.pyc
--- a/source/pycache/crop_protection_product.cpython-311.pyc
+++ b/source/pycache/crop_protection_product.cpython-311.pyc
--- a/source/pycache/ground.cpython-311.pyc
+++ b/source/pycache/ground.cpython-311.pyc
--- a/source/pycache/plant.cpython-311.pyc
+++ b/source/pycache/plant.cpython-311.pyc
--- a/source/pycache/tile.cpython-311.pyc
+++ b/source/pycache/tile.cpython-311.pyc
--- a/source/area/pycache/init.cpython-311.pyc
+++ b/source/area/pycache/init.cpython-311.pyc
--- a/source/area/pycache/constants.cpython-311.pyc
+++ b/source/area/pycache/constants.cpython-311.pyc
--- a/source/area/pycache/field.cpython-311.pyc
+++ b/source/area/pycache/field.cpython-311.pyc
--- a/source/area/pycache/tractor.cpython-311.pyc
+++ b/source/area/pycache/tractor.cpython-311.pyc
--- a/source/area/field.py
+++ b/source/area/field.py
@ -53,3 +53,10 @@ def get_tile_coordinates(index):
        return tile.x, tile.y
    else:
        return None
+    
+def get_tile_index():
+    valid_indices = []
+    for index, tile in enumerate(tiles):
+        if tile.image=="resources/images/sampling.png":
+            valid_indices.append(index)
+    return random.choice(valid_indices)
--- a/source/main.py
+++ b/source/main.py
@ -3,16 +3,17 @@ import time
 import random
 import pandas as pd
 import joblib
-
 from area.constants import WIDTH, HEIGHT, TILE_SIZE
 from area.field import drawWindow
 from area.tractor import Tractor, do_actions
 from area.field import tiles, fieldX, fieldY
-from area.field import get_tile_coordinates
+from area.field import get_tile_coordinates, get_tile_index
 from ground import Dirt
 from plant import Plant
 from bfs import graphsearch, Istate, succ
 from astar import a_star
+from NN.neural_network import load_model, load_image, guess_image
+
 WIN = pygame.display.set_mode((WIDTH, HEIGHT))
 pygame.display.set_caption('Intelligent tractor')

@ -23,7 +24,7 @@ def main():
    pygame.display.update()

 #getting coordinates of our "goal tile":
-    tile_index=127
+    tile_index = get_tile_index()
    tile_x, tile_y = get_tile_coordinates(tile_index)
    if tile_x is not None and tile_y is not None:
        print(f"Coordinates of tile {tile_index} are: ({tile_x}, {tile_y})")
@ -128,6 +129,13 @@ def main():
        print(predykcje)
        if predykcje == 'work':
            tractor.work_on_field(tile1, d1, p1)
+
+        #guessing the image under the tile:
+        tiles[tile_index].display_photo()
+        image_path = tiles[tile_index].photo
+        image_tensor = load_image(image_path)
+        prediction = guess_image(load_model(), image_tensor)
+        print(f"The predicted image is: {prediction}")
        time.sleep(30)
        print("\n")

--- a/source/model.pth
+++ b/source/model.pth
--- a/source/tile.py
+++ b/source/tile.py
@ -1,5 +1,8 @@
 import random
 import os
+import numpy as np
+import matplotlib.pyplot as plt
+from PIL import Image

 # path to plant images folder (used in randomize_photo function)
 folder_path = "resources/images/plant_photos"
@ -48,4 +51,9 @@ class Tile:
            self.image = "resources/images/rock_dirt.png"


-# DISCLAMER check column and choose plant type ("potato","wheat" etc.)
+    def display_photo(self):
+        image_path = self.photo
+        img = Image.open(image_path)
+        plt.imshow(img)
+        plt.axis('off')
+        plt.show()
Author	SHA1	Message	Date
MarRac	9667655a2a	changed neural network to CNN and added some tests	2024-05-26 23:28:22 +02:00
MarRac	b45c2e0f1f	added functions for loading images, model and testing	2024-05-26 19:56:18 +02:00
MarRac	fb0ec5057c	added useful functions for tile selection and more	2024-05-26 19:54:46 +02:00