petite-difference-challenge2/run.py

71 lines
2.8 KiB
Python
Raw Normal View History

2022-05-04 12:53:20 +02:00
import random
# Vocabulary passed (after lowercasing by normalize) to guess as the
# "woman" word list. Entries, their order and the repeated 'pomadka' are
# kept exactly as they were collected.
woman_words = [
    'ciąży', 'miesiączki', 'ciasto', 'ciążę',
    'zadowolona', 'ciąża', 'ciazy', 'antykoncepcyjne',
    'ginekologa', 'wysublimowany', 'płakałam', 'płakać',
    'depresja', 'tabletki', 'depresje', 'porodzie',
    'mąż', 'misiek', 'miesiączkę', 'krwawienie', 'ciasta', ':)',
    'Shih', 'Tzu', 'troszkę', 'julkaust@wp.pl', 'wigoru.',
    'młodej', 'kolezanka', 'kolezankami', 'koleżanką',
    'przyjaciółki', 'przyjaciółka', 'przyjaciółkami', 'pomadka',
    'kosmetyczka', 'okres', 'paznokcie', 'włosy', 'usta',
    'lekarz', 'lekarza', 'dziecko', 'dzieci', 'wino', 'sukienka',
    'sukienke', 'torebka', 'torebkę', 'makijaż', 'pomadka',
    'wesele', 'slub', 'weselu',
]
# Vocabulary passed (after lowercasing by normalize) to guess as the "man"
# word list.
#
# Every entry must be followed by a comma: Python silently concatenates
# adjacent string literals, so a missing comma fuses two words into one
# entry that matches neither of them.
#
# NOTE(review): entries such as 'zwiast', 'ubunt', 'youtub', 'counte',
# 'komput' and 'inform' look like truncated stems. guess compares whole
# tokens, so confirm that the input text is truncated the same way.
man_words = [
    'windows', 'gb', 'mb', 'meczu', 'pc', 'opony', 'apple', 'iphone',
    'zwiast', 'hd', 'ubunt',
    'system', 'serwer', 'youtub', 'sfd', 'kfd', 'elektr', 'autoce',
    'dobrep', 'merced', 'bmw',
    'audi', 'porsch', 'gry', 'gra', 'gram', 'cs', 'counte', 'piłka',
    'mecz', 'gol', 'bramka', 'linux',
    'robota', 'felga', 'lagi', 'żona', 'żony', 'żonie', 'żoną',
    'zona', 'zony', 'zonie', 'komput', 'inform',
    'sserwer', 'ziom', 'ziomków', 'ziomkow', 'kumpel', 'kolega',
    'kolegą', 'kolegi', 'pad',
]
def normalize(woman_words, man_words):
    """Return lowercased copies of both word lists.

    Args:
        woman_words: Iterable of strings.
        man_words: Iterable of strings.

    Returns:
        A tuple ``(woman_norm, man_norm)`` of two new lists holding the
        lowercased entries in their original order. The inputs are not
        modified.
    """
    woman_norm = [word.lower() for word in woman_words]
    man_norm = [word.lower() for word in man_words]
    return woman_norm, man_norm
def guess(woman_words_norm, man_words_norm, dane):
    """Label each text by counting hits against the two vocabularies.

    Args:
        woman_words_norm: Lowercased words counted as "woman" hits.
        man_words_norm: Lowercased words counted as "man" hits.
        dane: Iterable of text lines to label.

    Returns:
        A list with one string per input line: '1' when the line has at
        least as many man hits as woman hits (ties and lines without any
        hit included), otherwise '0'.
    """
    # Build the lookup sets once, outside the per-line loop, so each token
    # check is a constant-time membership test instead of a list scan.
    man_vocab = set(man_words_norm)
    woman_vocab = set(woman_words_norm)

    result = []
    for text in dane:
        man_count = 0
        woman_count = 0
        # The vocabularies are lowercased, so tokens have to be lowercased
        # as well; otherwise capitalised words could never match.
        for token in text.lower().split():
            # A token present in both vocabularies counts as a man hit only.
            if token in man_vocab:
                man_count += 1
            elif token in woman_vocab:
                woman_count += 1
        result.append('1' if man_count >= woman_count else '0')
    return result
# Lowercase both vocabularies once; every dataset below reuses them.
woman_words_norm, man_words_norm = normalize(woman_words, man_words)


def _predict_file(in_path, out_path):
    """Label every line of in_path and write one label per line to out_path."""
    # The vocabularies contain non-ASCII Polish characters, so the input is
    # decoded explicitly instead of with the locale-dependent default.
    # NOTE(review): assumes the in.tsv files are UTF-8 -- confirm.
    with open(in_path, encoding='utf-8') as data:
        lines = [line.rstrip('\n') for line in data]

    labels = guess(woman_words_norm, man_words_norm, lines)

    with open(out_path, 'w', encoding='utf-8') as file:
        file.writelines(label + "\n" for label in labels)


# Each dataset directory holds an in.tsv to read and receives an out.tsv.
for dataset_dir in ('dev-0', 'dev-1', 'test-A'):
    _predict_file(dataset_dir + '/in.tsv', dataset_dir + '/out.tsv')