ium_434704/training.py

48 lines
1.3 KiB
Python
Raw Normal View History

import sys
2021-05-13 22:20:25 +02:00
import pandas as pd
import numpy as np
import tensorflow as tf
import os.path
from tensorflow import keras
from tensorflow.keras import layers
from tensorflow.keras.layers.experimental import preprocessing
arguments = sys.argv[1:]
2021-05-15 03:00:10 +02:00
verbose = arguments[0]
epochs = arguments[1]
2021-05-13 22:20:25 +02:00
pd.set_option("display.max_columns", None)
# Wczytanie danych
2021-05-14 00:58:33 +02:00
train_data = pd.read_csv("./MoviesOnStreamingPlatforms_updated.train")
2021-05-13 22:20:25 +02:00
# Stworzenie modelu
columns_to_use = ['Year', 'Runtime', 'Netflix']
train_X = tf.convert_to_tensor(train_data[columns_to_use])
train_Y = tf.convert_to_tensor(train_data[["IMDb"]])
normalizer = preprocessing.Normalization(input_shape=[3,])
normalizer.adapt(train_X)
if os.path.isdir('linear_regression'):
model = keras.models.load_model('linear_regression')
else:
model = keras.Sequential([
keras.Input(shape=(len(columns_to_use),)),
normalizer,
2021-05-14 04:01:11 +02:00
layers.Dense(30, activation='relu'),
layers.Dense(10, activation='relu'),
layers.Dense(25, activation='relu'),
2021-05-13 22:20:25 +02:00
layers.Dense(1)
])
model.compile(loss='mean_absolute_error',
2021-05-14 04:01:11 +02:00
optimizer=tf.keras.optimizers.Adam(0.001),
metrics=[tf.keras.metrics.RootMeanSquaredError()])
2021-05-13 22:20:25 +02:00
2021-05-14 04:01:11 +02:00
model.fit(train_X, train_Y, verbose=verbose, epochs=epochs)
2021-05-13 22:20:25 +02:00
2021-05-14 04:01:11 +02:00
model.save('linear_regression.h5')