SZI2019SmieciarzWmi/VowpalWabbit/generate_dataset.py

39 lines
1.4 KiB
Python
Raw Normal View History

import glob, datetime, os
from VowpalWrapper.wrapper import wrap_ex
2019-06-05 18:21:27 +02:00
def _remove_partial_inputs(pattern):
    """Delete every file whose path matches the glob *pattern*."""
    for stale_path in glob.glob(pattern):
        try:
            os.remove(stale_path)
        except FileNotFoundError:
            # The file disappeared between the glob and the delete;
            # it is gone either way, so there is nothing left to do.
            pass


def _merge_partial_inputs(pattern, destination):
    """Concatenate every file matching the glob *pattern* into *destination*."""
    # Open with "w" (not append) so that a half-written file left behind by
    # an interrupted earlier run cannot leak stale lines into this dataset.
    with open(destination, "w") as merged:
        for partial_path in glob.glob(pattern):
            # Read-only access is enough here; the context managers make
            # sure both handles are closed even if a read or write fails.
            with open(partial_path, "r") as partial:
                merged.writelines(partial)


def generate_dataset(run_count, clear, model_name, learn):
    """Collect partial input maps, merge them into one dataset and optionally train.

    Steps, in order:

    1. If *clear* is true, delete the existing
       ``./VowpalWabbit/VowpalInputData/input_map*.txt`` files.
    2. Call ``wrap_ex`` with ``./VowpalWabbit/vowpal_auto_run.sh <run_count>``.
    3. Merge all ``input_map*.txt`` files into
       ``./VowpalWabbit/VowpalInputData/input_dataset<MMDDHHMM><model_name>.txt``.
    4. If *learn* is true, call ``wrap_ex`` with a ``vw --oaa 5`` command that
       reads the merged file and writes
       ``./VowpalWabbit/VowpalModels/<model_name>.model``.

    Progress messages are printed to stdout throughout.

    Args:
        run_count: Value appended (via ``str``) to the auto-run script command.
        clear: Boolean flag; when true the stored partial inputs are removed
            before collecting new data.
        model_name: Suffix of the dataset file name and base name of the
            model file.
        learn: Boolean flag; when true the ``vw`` command is issued after the
            dataset has been written.

    Returns:
        None.
    """
    partial_pattern = './VowpalWabbit/VowpalInputData/input_map*.txt'

    print("GENERATING DATASET")
    if clear:
        print("Clearing stored data... ", end='')
        _remove_partial_inputs(partial_pattern)
        print("Done")

    print("Collecting data from " + str(run_count) + " runs...")
    # NOTE(review): wrap_ex is imported from VowpalWrapper.wrapper and is
    # presumably a shell-command runner -- confirm against that module.
    wrap_ex("./VowpalWabbit/vowpal_auto_run.sh " + str(run_count))
    print("Collected data")

    # Month/day/hour/minute stamp taken from the local clock.
    timestamp = datetime.datetime.now().strftime("%m%d%H%M")
    filename = ("./VowpalWabbit/VowpalInputData/input_dataset"
                + timestamp + model_name)
    print("Creating input file " + filename + ".txt... ", end='')

    # The dataset is written under an extension-less name first and only
    # receives its ".txt" suffix once it is complete.
    _merge_partial_inputs(partial_pattern, filename)
    # os.replace overwrites an existing target on every platform, whereas
    # os.rename raises on Windows when the target already exists.
    os.replace(filename, filename + ".txt")
    print("Done")

    if learn:
        print("Learning from " + str(filename) + ".txt")
        model_file = "./VowpalWabbit/VowpalModels/" + model_name + ".model"
        wrap_ex("vw --oaa 5 " + filename + ".txt -f " + model_file)
        print("Learning process complete, model saved to " + model_file)
2019-06-11 19:36:51 +02:00
# Module-level invocation: executes whenever this file is run or imported.
# Clears the stored partial inputs, requests 100 runs, then trains "wolmo".
generate_dataset(
    run_count=100,
    clear=True,
    model_name="wolmo",
    learn=True,
)