71 lines
2.8 KiB
Python
71 lines
2.8 KiB
Python
import random
|
|
|
|
# Keywords whose presence in a text counts towards the "woman" score.
# Order and duplicates are kept exactly as originally listed.
woman_words = [
    'ciąży', 'miesiączki', 'ciasto', 'ciążę', 'zadowolona', 'ciąża',
    'ciazy', 'antykoncepcyjne',
    'ginekologa', 'wysublimowany', 'płakałam', 'płakać', 'depresja',
    'tabletki', 'depresje', 'porodzie',
    'mąż', 'misiek', 'miesiączkę', 'krwawienie', 'ciasta', ':)',
    'Shih', 'Tzu', 'troszkę', 'julkaust@wp.pl', 'wigoru.', 'młodej',
    'kolezanka', 'kolezankami', 'koleżanką',
    'przyjaciółki', 'przyjaciółka', 'przyjaciółkami', 'pomadka',
    'kosmetyczka', 'okres', 'paznokcie', 'włosy', 'usta', 'lekarz',
    'lekarza', 'dziecko', 'dzieci', 'wino', 'sukienka',
    'sukienke', 'torebka', 'torebkę', 'makijaż', 'pomadka', 'wesele',
    'slub', 'weselu',
]
|
|
|
|
# Keywords whose presence in a text counts towards the "man" score.
#
# Every entry is separated by an explicit comma. Previously 'lagi' 'żona' and
# 'inform' 'sserwer' were adjacent string literals, which Python silently
# concatenates into the single entries 'lagiżona' and 'informsserwer'.
#
# NOTE(review): several entries look like truncated stems ('youtub', 'komput',
# 'porsch', ...) and 'sserwer' looks like a typo of 'serwer' — confirm intent.
man_words = [
    'windows', 'gb', 'mb', 'meczu', 'pc', 'opony', 'apple', 'iphone',
    'zwiast', 'hd', 'ubunt',
    'system', 'serwer', 'youtub', 'sfd', 'kfd', 'elektr', 'autoce',
    'dobrep', 'merced', 'bmw',
    'audi', 'porsch', 'gry', 'gra', 'gram', 'cs', 'counte', 'piłka',
    'mecz', 'gol', 'bramka', 'linux',
    'robota', 'felga', 'lagi', 'żona', 'żona', 'żony', 'żonie', 'żoną',
    'zona', 'zony', 'zonie', 'komput', 'inform',
    'sserwer', 'ziom', 'ziomków', 'ziomkow', 'kumpel', 'kolega', 'kolegą',
    'kolegi', 'pad',
]
|
|
|
|
def normalize(woman_words, man_words):
    """Return lower-cased copies of the two keyword lists.

    Args:
        woman_words: iterable of strings.
        man_words: iterable of strings.

    Returns:
        A ``(woman, man)`` tuple of new lists holding each input string
        converted with ``str.lower()``, in the original order.
    """
    lowered_woman = [word.lower() for word in woman_words]
    lowered_man = [word.lower() for word in man_words]
    return lowered_woman, lowered_man
|
|
|
|
def guess(woman_words_norm, man_words_norm, dane):
    """Label each text as '1' or '0' by counting keyword occurrences.

    Every text is lower-cased and split on whitespace. Each token that is a
    man keyword adds one to the man score; otherwise, if it is a woman
    keyword, it adds one to the woman score (a token present in both
    vocabularies counts as a man keyword only).

    Args:
        woman_words_norm: iterable of lower-cased woman keywords.
        man_words_norm: iterable of lower-cased man keywords.
        dane: iterable of text strings to classify.

    Returns:
        A list with one label per input text: '1' when the man score is
        greater than or equal to the woman score (ties included), else '0'.
    """
    # Build the lookup sets once so each token check is O(1), not a list scan.
    man_vocab = set(man_words_norm)
    woman_vocab = set(woman_words_norm)

    result = []
    for text in dane:
        man_count = 0
        woman_count = 0
        # The vocabularies are lower-cased, so tokens must be lower-cased too;
        # otherwise capitalised words in the text could never match.
        for token in text.lower().split():
            if token in man_vocab:
                man_count += 1
            elif token in woman_vocab:
                woman_count += 1
        result.append('1' if man_count >= woman_count else '0')
    return result
|
|
|
|
woman_words_norm, man_words_norm = normalize(woman_words, man_words)


def _label_dataset(directory):
    """Classify every line of ``<directory>/in.tsv`` into ``<directory>/out.tsv``.

    Each input line (without its newline) is passed to ``guess``; the labels
    are written one per line, in input order.

    Returns:
        A ``(texts, labels)`` tuple: the list of input lines and the list of
        labels produced for them.
    """
    # Explicit UTF-8 so the Polish keywords match regardless of the platform's
    # default locale encoding. NOTE(review): assumes the data files are UTF-8.
    with open(directory + '/in.tsv', encoding='utf-8') as data:
        texts = [line.replace('\n', '') for line in data]

    labels = guess(woman_words_norm, man_words_norm, texts)

    with open(directory + '/out.tsv', 'w', encoding='utf-8') as file:
        file.writelines(label + "\n" for label in labels)

    return texts, labels


# Same three datasets as before; the module-level names are kept so any code
# that inspects them after the run keeps working.
dane1, result1 = _label_dataset('dev-0')
dane2, result2 = _label_dataset('dev-1')
dane3, result3 = _label_dataset('test-A')
|