System_Dialogowy_Janet/Code/Create_lists.py

29 lines
641 B
Python
Raw Normal View History

2021-05-17 11:27:13 +02:00
import pandas as pd
import numpy as np
# Collect the "# text" and "# intent" comment values from Janet.conllu and
# pair them up, one row per utterance, in the DataFrame `df`.
#
# The value is taken by slicing off a fixed-width prefix, which assumes the
# lines look like "# text: ..." (8 characters) and "# intent: ..."
# (10 characters) -- TODO confirm against the data file.
texts = []
intents = []
count = 0  # stays 0 when the file is empty

# The context manager closes the handle even if reading fails. The encoding
# is pinned because CoNLL-U is specified as UTF-8; relying on the platform
# default can mis-decode non-ASCII text.
with open('Janet.conllu', 'r', encoding='utf-8') as file1:
    Lines = file1.readlines()

for count, line in enumerate(Lines, start=1):
    # Prefixes are tested on the raw line, so an indented marker is ignored.
    if line.startswith('# text'):
        p_line = line.strip()  # drops the trailing newline
        print("Line{}: {}".format(count, p_line[8:]))
        texts.append(p_line[8:])
    if line.startswith('# intent'):
        x_line = line.strip()
        print("Line{}: {}".format(count, x_line[10:]))
        intents.append(x_line[10:])

# pandas rejects columns of different lengths; fail with a message that names
# the actual problem instead of its generic "arrays must be the same length".
if len(texts) != len(intents):
    raise ValueError(
        "Janet.conllu has {} '# text' lines but {} '# intent' lines".format(
            len(texts), len(intents)
        )
    )

data = {'Text': texts, 'Intent': intents}
df = pd.DataFrame(data)
print(df.head(5))
2021-05-17 12:03:10 +02:00
# Write the table to data.tsv as tab-separated values, without the
# DataFrame's row index column.
df.to_csv(
    'data.tsv',
    sep='\t',
    index=False,
)