forked from kubapok/retroc2
final
This commit is contained in:
parent
8359c05a74
commit
c2b77f7492
40000
dev-0/out.tsv
40000
dev-0/out.tsv
File diff suppressed because it is too large
Load Diff
23126
dev-1/out.tsv
23126
dev-1/out.tsv
File diff suppressed because it is too large
Load Diff
@ -2,7 +2,7 @@
|
||||
"cells": [
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 1,
|
||||
"execution_count": 5,
|
||||
"id": "8f5480f9-fa82-4150-acff-9309fdc43690",
|
||||
"metadata": {},
|
||||
"outputs": [
|
||||
@ -13,7 +13,7 @@
|
||||
" ('linearregression', LinearRegression())])"
|
||||
]
|
||||
},
|
||||
"execution_count": 1,
|
||||
"execution_count": 5,
|
||||
"metadata": {},
|
||||
"output_type": "execute_result"
|
||||
}
|
||||
@ -28,6 +28,7 @@
|
||||
"with open('train/train.tsv', 'r', encoding='utf8') as file:\n",
|
||||
" train_data = pd.read_csv(file, sep='\\t', names=['Begin', 'End', 'Title', 'Publisher', 'Text'])\n",
|
||||
"\n",
|
||||
"train_data = train_data[:20000] \n",
|
||||
" \n",
|
||||
"X = train_data['Text']\n",
|
||||
"Y = train_data['Begin']\n",
|
||||
@ -39,7 +40,7 @@
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 2,
|
||||
"execution_count": 6,
|
||||
"id": "02e89f1c-a2d0-4d41-94a2-aa86b257069d",
|
||||
"metadata": {},
|
||||
"outputs": [],
|
||||
@ -61,7 +62,7 @@
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 3,
|
||||
"execution_count": null,
|
||||
"id": "b85f5e22-eafb-41ee-aa2c-20c338d42701",
|
||||
"metadata": {},
|
||||
"outputs": [],
|
||||
|
2
run.py
2
run.py
@ -23,7 +23,7 @@ def write_pred(filename, predictions):
|
||||
|
||||
|
||||
|
||||
# train_data = train_data[:10000]
|
||||
train_data = train_data[:10000]
|
||||
|
||||
X = train_data['Text']
|
||||
Y = train_data['Begin']
|
||||
|
28440
test-A/out.tsv
28440
test-A/out.tsv
File diff suppressed because it is too large
Load Diff
Loading…
Reference in New Issue
Block a user