forked from kubapok/retroc2
final
This commit is contained in:
parent
8359c05a74
commit
c2b77f7492
40000
dev-0/out.tsv
40000
dev-0/out.tsv
File diff suppressed because it is too large
Load Diff
23126
dev-1/out.tsv
23126
dev-1/out.tsv
File diff suppressed because it is too large
Load Diff
@ -2,7 +2,7 @@
|
|||||||
"cells": [
|
"cells": [
|
||||||
{
|
{
|
||||||
"cell_type": "code",
|
"cell_type": "code",
|
||||||
"execution_count": 1,
|
"execution_count": 5,
|
||||||
"id": "8f5480f9-fa82-4150-acff-9309fdc43690",
|
"id": "8f5480f9-fa82-4150-acff-9309fdc43690",
|
||||||
"metadata": {},
|
"metadata": {},
|
||||||
"outputs": [
|
"outputs": [
|
||||||
@ -13,7 +13,7 @@
|
|||||||
" ('linearregression', LinearRegression())])"
|
" ('linearregression', LinearRegression())])"
|
||||||
]
|
]
|
||||||
},
|
},
|
||||||
"execution_count": 1,
|
"execution_count": 5,
|
||||||
"metadata": {},
|
"metadata": {},
|
||||||
"output_type": "execute_result"
|
"output_type": "execute_result"
|
||||||
}
|
}
|
||||||
@ -28,6 +28,7 @@
|
|||||||
"with open('train/train.tsv', 'r', encoding='utf8') as file:\n",
|
"with open('train/train.tsv', 'r', encoding='utf8') as file:\n",
|
||||||
" train_data = pd.read_csv(file, sep='\\t', names=['Begin', 'End', 'Title', 'Publisher', 'Text'])\n",
|
" train_data = pd.read_csv(file, sep='\\t', names=['Begin', 'End', 'Title', 'Publisher', 'Text'])\n",
|
||||||
"\n",
|
"\n",
|
||||||
|
"train_data = train_data[:20000] \n",
|
||||||
" \n",
|
" \n",
|
||||||
"X = train_data['Text']\n",
|
"X = train_data['Text']\n",
|
||||||
"Y = train_data['Begin']\n",
|
"Y = train_data['Begin']\n",
|
||||||
@ -39,7 +40,7 @@
|
|||||||
},
|
},
|
||||||
{
|
{
|
||||||
"cell_type": "code",
|
"cell_type": "code",
|
||||||
"execution_count": 2,
|
"execution_count": 6,
|
||||||
"id": "02e89f1c-a2d0-4d41-94a2-aa86b257069d",
|
"id": "02e89f1c-a2d0-4d41-94a2-aa86b257069d",
|
||||||
"metadata": {},
|
"metadata": {},
|
||||||
"outputs": [],
|
"outputs": [],
|
||||||
@ -61,7 +62,7 @@
|
|||||||
},
|
},
|
||||||
{
|
{
|
||||||
"cell_type": "code",
|
"cell_type": "code",
|
||||||
"execution_count": 3,
|
"execution_count": null,
|
||||||
"id": "b85f5e22-eafb-41ee-aa2c-20c338d42701",
|
"id": "b85f5e22-eafb-41ee-aa2c-20c338d42701",
|
||||||
"metadata": {},
|
"metadata": {},
|
||||||
"outputs": [],
|
"outputs": [],
|
||||||
|
2
run.py
2
run.py
@ -23,7 +23,7 @@ def write_pred(filename, predictions):
|
|||||||
|
|
||||||
|
|
||||||
|
|
||||||
# train_data = train_data[:10000]
|
train_data = train_data[:10000]
|
||||||
|
|
||||||
X = train_data['Text']
|
X = train_data['Text']
|
||||||
Y = train_data['Begin']
|
Y = train_data['Begin']
|
||||||
|
28440
test-A/out.tsv
28440
test-A/out.tsv
File diff suppressed because it is too large
Load Diff
Loading…
Reference in New Issue
Block a user