#!/usr/bin/env python3
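# Usage sketch (the file names below are illustrative placeholders):
#   ./train.py <train_samples.npz> <model_output_path> <epochs>
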
import sys
import pickle
import settings  # project-local module, presumably configuration; not referenced directly below
import numpy as np
from keras.layers import Dense, LSTM, Dropout, Activation
from keras.models import Sequential
from keras.utils.np_utils import to_categorical


def load_data(samples_path):
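    # The samples archive is a NumPy .npz file: input sequences are stored
    # under 'arr_0' and the corresponding target notes under 'arr_1'.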
    print('Loading... {}'.format(samples_path))
    # Load the archive once and read both arrays from it.
    samples = np.load(samples_path, allow_pickle=True)
    train_X = samples['arr_0']
    train_y = samples['arr_1']
    return train_X, train_y


# TODO: make a transformer class with fit, transform and reverse methods
def preprocess_samples(train_X, train_y):
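    # Build the note vocabulary from both inputs and targets, then map each
    # note to an integer index (and back) for the network.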
    vocab_X = np.unique(train_X)
    vocab_y = np.unique(train_y)
    # Deduplicate notes that occur in both X and y; a plain concatenation
    # would inflate n_vocab and skew the integer mappings.
    vocab = np.unique(np.concatenate([vocab_X, vocab_y]))
    n_vocab = vocab.shape[0]
    note_to_int = dict((note, number) for number, note in enumerate(vocab))
    int_to_note = dict((number, note) for number, note in enumerate(vocab))
    _train_X = []
    for sample in train_X:
        # TODO: add normalization
        _train_X.append([note_to_int[note] for note in sample])

    # LSTM layers expect input shaped (samples, timesteps, features).
    train_X = np.array(_train_X).reshape(train_X.shape[0], train_X.shape[1], 1)
    train_y = np.array([note_to_int[note] for note in train_y]).reshape(-1, 1)
    # One-hot encode the targets; fixing num_classes keeps the width equal to
    # n_vocab even when some notes never occur as targets.
    train_y = to_categorical(train_y, num_classes=n_vocab)

    return train_X, train_y, n_vocab, int_to_note


train_data_path = sys.argv[1]

train_X, train_y = load_data(train_data_path)
train_X, train_y, n_vocab, int_to_note = preprocess_samples(train_X, train_y)

save_model_path = sys.argv[2]
epochs = int(sys.argv[3])
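
# Three stacked 512-unit LSTM layers with dropout, followed by dense layers;
# the softmax output assigns a probability to every note in the vocabulary.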
model = Sequential()
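# input_shape is (sequence length, 1): one integer-encoded note per timestep.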
model.add(LSTM(512, input_shape=(train_X.shape[1], train_X.shape[2]), return_sequences=True))
model.add(Dropout(0.3))
model.add(LSTM(512, return_sequences=True))
model.add(Dropout(0.3))
model.add(LSTM(512))
model.add(Dense(256))
model.add(Dropout(0.3))
model.add(Dense(n_vocab))
model.add(Activation('softmax'))
model.compile(loss='categorical_crossentropy', optimizer='rmsprop')

# Train the model for the number of epochs given on the command line.
print('Training...')
model.fit(train_X, train_y, epochs=epochs, batch_size=64)

# Save the model, together with the extra information (note mapping,
# vocabulary size and sequence length) needed to generate music from it.
with open(save_model_path, 'wb') as f:
    pickle.dump(model, f)
with open('{}_dict'.format(save_model_path), 'wb') as f:
    pickle.dump((int_to_note, n_vocab, train_X.shape[1]), f)
print('Done!')
print("Model saved to: {}".format(save_model_path))