change word limit from 400 to 450
This commit is contained in:
parent
00fec94240
commit
ab804f0c9e
@@ -31,7 +31,7 @@ for dataset in 'train', 'dev-0':
|
||||
text = text.replace('\\n','')
|
||||
|
||||
text_splitted = text.split(' ')
|
||||
for i in range(0, len(text_splitted), 400):
|
||||
text_chunk = ' '.join(text_splitted[i:i+400])
|
||||
for i in range(0, len(text_splitted), 450):
|
||||
text_chunk = ' '.join(text_splitted[i:i+450])
|
||||
f_hf.write(text_chunk +'\n')
|
||||
|
||||
|
@@ -31,8 +31,8 @@ for dataset in 'train', 'dev-0':
|
||||
text = text.replace('\\n','')
|
||||
|
||||
text_splitted = text.split(' ')
|
||||
for i in range(0, len(text_splitted), 400):
|
||||
text_chunk = ' '.join(text_splitted[i:i+400])
|
||||
for i in range(0, len(text_splitted), 450):
|
||||
text_chunk = ' '.join(text_splitted[i:i+450])
|
||||
text_chunk = 'year : ' + year + ' month : ' + month + ' day ' + day_of_month + ' weekday : ' + weekday + ' ' + text_chunk
|
||||
f_hf.write(text_chunk +'\n')
|
||||
|
||||
|
Loading…
Reference in New Issue
Block a user