This commit is contained in:
eugene 2023-06-07 00:34:30 +02:00
parent 1b2296cf4c
commit 3fef5dda76
3 changed files with 158 additions and 0 deletions

View File

@ -11,6 +11,8 @@ RUN pip3 install tensorflow==2.12.*
# PyTorch and torchvision, unpinned.
RUN pip3 install torch torchvision
# NOTE(review): disabled CPU-only pin; the trailing `-f` has no index URL here,
# so this line cannot be re-enabled as written.
#RUN pip install torch==1.8.0+cpu torchvision==0.9.0+cpu torchaudio==0.8.0 -f
RUN pip3 install pickle5
# Sacred experiment tracking plus the MongoDB client library
# (presumably for Sacred's MongoObserver; confirm against the training script).
RUN pip3 install sacred
RUN pip3 install pymongo
# Disabled virtualenv setup; packages above are installed system-wide instead.
#RUN apt install python3.10-venv -y
#RUN python3 -m venv docker_ium

Jenkinsfile-lab7 Normal file
View File

@ -0,0 +1,55 @@
// Lab 7 pipeline: builds the agent from the repository Dockerfile, runs the
// data script inside it, and archives whatever lands under experiments/.
pipeline {
    agent {
        // Build the agent container from the Dockerfile in the checkout.
        dockerfile true
    }
    stages {
        stage('do nothing') {
            steps {
                echo ("do nothing")
            }
        }
        stage('Run Script') {
            steps {
                echo("run data script")
                sh "ls -a"
                // NOTE(review): no file operand is present after the mode;
                // confirm which script should be made executable.
                sh "chmod u+x"
                // NOTE(review): no script path is present after `python3`;
                // confirm the script to run. Also note that the exit status
                // of a pipe is that of `tee`, so a failing script would not
                // fail this step unless `pipefail` is enabled.
                sh "python3 | tee metrics.txt"
            }
        }
        stage('Archive Output') {
            steps {
                archiveArtifacts 'experiments/**/*.*'
            }
        }
    }
}

101 Normal file
View File

@ -0,0 +1,101 @@
import os
import pickle

import pandas as pd
import torch
import torch.nn as nn
import torch.optim as optim
from sacred import Experiment
from sacred.observers import FileStorageObserver, MongoObserver
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import LabelEncoder
from torch.utils.data import DataLoader, Dataset
# Sacred experiment whose runs are reported to a MongoDB observer.
# The connection URL can be overridden with the SACRED_MONGO_URL environment
# variable so that credentials do not have to live in the source tree; the
# literal below is only the fallback.
# NOTE(review): the fallback URL has no host after '@' as it appears here;
# confirm the intended server address.
ex = Experiment("s151636", interactive=True, save_git_info=False)
ex.observers.append(
    MongoObserver(
        url=os.environ.get('SACRED_MONGO_URL', 'mongodb://admin:IUM_2021@'),
        db_name='sacred',
    )
)
# Define the neural network model
class Model(nn.Module):
    """Small regressor mapping one scalar feature to one scalar output.

    Architecture: ``Linear(1, 64) -> ReLU -> Linear(64, 1)``.
    """

    def __init__(self):
        super().__init__()
        # Attribute names and creation order are kept stable: they determine
        # the state_dict keys and the order in which weights are initialised.
        self.fc1 = nn.Linear(1, 64)
        self.fc2 = nn.Linear(64, 1)
        self.relu = nn.ReLU()

    def forward(self, x):
        """Return the network output for ``x``.

        Args:
            x: Float tensor whose last dimension has size 1.

        Returns:
            Tensor with the same leading dimensions as ``x`` and a last
            dimension of size 1.
        """
        hidden = self.relu(self.fc1(x))
        return self.fc2(hidden)
# Define a custom dataset
class CustomDataset(Dataset):
    """Dataset of (feature, target) pairs stored as float32 column tensors.

    Args:
        X: Feature values. A pandas object (its ``.values`` array is used)
            or any sequence/array accepted by ``torch.tensor``.
        y: Target values, in the same forms as ``X``.

    Both inputs are flattened into tensors of shape ``(n, 1)``.
    """

    def __init__(self, X, y):
        self.X = self._as_column(X)
        self.y = self._as_column(y)

    @staticmethod
    def _as_column(values):
        """Copy ``values`` into a float32 tensor of shape ``(n, 1)``."""
        # pandas objects expose the underlying array as ``.values``; plain
        # sequences and arrays are passed through unchanged.
        raw = getattr(values, "values", values)
        return torch.tensor(raw, dtype=torch.float32).reshape(-1, 1)

    def __len__(self):
        """Return the number of samples."""
        return len(self.X)

    def __getitem__(self, idx):
        """Return the ``(feature, target)`` pair at position ``idx``."""
        return self.X[idx], self.y[idx]
def train_model():
    """Train the writer-to-rating regressor and persist its artefacts.

    Reads ``data.csv``, keeps the ``Rating`` and ``Writer`` columns, drops
    rows with missing values and label-encodes ``Writer``. A ``Model`` is
    fitted on 80% of the rows (split with ``random_state=42``) for 10 epochs
    using Adam and mean-squared-error loss.

    Side effects:
        * writes the trained weights (``state_dict``) to ``model.pth``
        * pickles the fitted ``LabelEncoder`` to ``encoder.pkl``
        * prints the predicted rating for the writer ``'Jim Cash'``

    Raises:
        FileNotFoundError: If ``data.csv`` does not exist.
        KeyError: If the CSV lacks a ``Rating`` or ``Writer`` column.
        ValueError: If ``'Jim Cash'`` does not occur in the ``Writer``
            column (the encoder rejects labels it was not fitted on).
    """
    # Load the dataset and keep only complete (Rating, Writer) rows
    df = pd.read_csv('data.csv')
    data = df[['Rating', 'Writer']].dropna()

    # Convert the 'Writer' column to numeric using label encoding
    encoder = LabelEncoder()
    data['Writer'] = encoder.fit_transform(data['Writer'])

    # Split the data into training and testing sets. The held-out 20% is
    # not evaluated here; the split is kept so the training rows stay the
    # same as before.
    X = data['Writer']
    y = data['Rating']
    X_train, _, y_train, _ = train_test_split(
        X, y, test_size=0.2, random_state=42
    )

    # Create the model, loss function and optimizer
    model = Model()
    criterion = nn.MSELoss()
    optimizer = optim.Adam(model.parameters())

    train_dataset = CustomDataset(X_train, y_train)
    train_dataloader = DataLoader(train_dataset, batch_size=64, shuffle=True)

    # Train the model
    model.train()
    for _epoch in range(10):
        for inputs, targets in train_dataloader:
            # Gradients accumulate by default, so clear them for each batch.
            optimizer.zero_grad()
            outputs = model(inputs)
            loss = criterion(outputs, targets)
            # Without the backward pass and optimizer step the weights
            # would never move away from their random initialisation.
            loss.backward()
            optimizer.step()

    # Save the model to a file
    torch.save(model.state_dict(), 'model.pth')

    # Save the encoder to a file
    with open('encoder.pkl', 'wb') as f:
        pickle.dump(encoder, f)

    # Make predictions on new data
    model.eval()
    new_writer = 'Jim Cash'
    new_writer_encoded = torch.tensor(encoder.transform([new_writer])).float()
    with torch.no_grad():  # inference only; no autograd graph needed
        rating_prediction = model(new_writer_encoded)
    print("Predicted rating for the writer 'Jim Cash':", rating_prediction.item())