s444476 - add more characteristic words
This commit is contained in:
parent
431761f6f5
commit
eb5a10172e
52728
dev-0/out.tsv
52728
dev-0/out.tsv
File diff suppressed because it is too large
Load Diff
61244
dev-1/out.tsv
61244
dev-1/out.tsv
File diff suppressed because it is too large
Load Diff
15
run.py
15
run.py
@ -1,10 +1,13 @@
|
||||
import random
|
||||
|
||||
man_words_list = ['silnik', 'windows', 'silnika', 'gb', 'mb', 'meczu', 'pc', 'opony', 'apple', 'iphone', 'zwiastuny', 'hd',
|
||||
'ubuntu', 'systemu', 'serwer']
|
||||
man_list = ['silnik', 'windows', 'silnika', 'gb', 'mb', 'meczu', 'pc', 'opony', 'apple', 'iphone', 'zwiastuny', 'hd',
|
||||
'ubuntu', 'systemu', 'serwer', "samoch", 'kompute', 'pc', 'sport', 'km', 'paliw', 'kierownic',
|
||||
'piw', 'koleg', 'śrub', 'mecz']
|
||||
|
||||
woman_words_list = ['ciąży', 'miesiączki', 'ciasto', 'ciążę', 'zadowolona', 'ciąża', 'ciazy', 'antykoncepcyjne', 'ginekologa',
|
||||
'tabletki', 'porodzie', 'mąż', 'miesiączkę', 'krwawienie', 'ciasta']
|
||||
woman_list = ['ciąży', 'miesiączki', 'ciasto', 'ciążę', 'zadowolona', 'ciąża', 'ciazy', 'antykoncepcyjne', 'ginekologa',
|
||||
'tabletki', 'porodzie', 'mąż', 'miesiączkę', 'krwawienie', 'ciasta', 'fryzjer', 'kosmety', 'biżuter', 'sukienk',
|
||||
'kolczy', 'obcas', 'bransolet', 'spink', 'torebk', 'szmink', 'kobiet', 'koleżan', 'kuchni', 'gotowa', 'przepis',
|
||||
'miesiączk']
|
||||
|
||||
def classificator(path_in, path_out):
|
||||
result = []
|
||||
@ -13,11 +16,11 @@ def classificator(path_in, path_out):
|
||||
for line in lines:
|
||||
counter_man = 0
|
||||
counter_woman = 0
|
||||
for word in man_words_list:
|
||||
for word in man_list:
|
||||
if word in line:
|
||||
counter_man += 1
|
||||
|
||||
for word in woman_words_list:
|
||||
for word in woman_list:
|
||||
if word in line:
|
||||
counter_woman += 1
|
||||
|
||||
|
51364
test-A/out.tsv
51364
test-A/out.tsv
File diff suppressed because it is too large
Load Diff
Loading…
Reference in New Issue
Block a user