This commit is contained in:
Sebastian 2022-05-18 00:51:36 +02:00
parent c3d349bf38
commit f6a8309517
5 changed files with 34225 additions and 34225 deletions

View File

@ -44,7 +44,7 @@
"source": [ "source": [
"train = pd.read_csv('train/train.tsv', header=None, sep='\\t', error_bad_lines=False)\n", "train = pd.read_csv('train/train.tsv', header=None, sep='\\t', error_bad_lines=False)\n",
"print(len(train))\n", "print(len(train))\n",
"train = train.head(30000)" "train = train.head(40000)"
] ]
}, },
{ {
@ -122,7 +122,7 @@
"name": "stdout", "name": "stdout",
"output_type": "stream", "output_type": "stream",
"text": [ "text": [
"4261.093474053155\n" "4289.2810262872745\n"
] ]
} }
], ],

File diff suppressed because it is too large Load Diff

View File

@ -44,7 +44,7 @@
"source": [ "source": [
"train = pd.read_csv('train/train.tsv', header=None, sep='\\t', error_bad_lines=False)\n", "train = pd.read_csv('train/train.tsv', header=None, sep='\\t', error_bad_lines=False)\n",
"print(len(train))\n", "print(len(train))\n",
"train = train.head(30000)" "train = train.head(40000)"
] ]
}, },
{ {
@ -122,7 +122,7 @@
"name": "stdout", "name": "stdout",
"output_type": "stream", "output_type": "stream",
"text": [ "text": [
"4261.093474053155\n" "4289.2810262872745\n"
] ]
} }
], ],

2
run.py
View File

@ -19,7 +19,7 @@ from sklearn.pipeline import make_pipeline
train = pd.read_csv('train/train.tsv', header=None, sep='\t', error_bad_lines=False) train = pd.read_csv('train/train.tsv', header=None, sep='\t', error_bad_lines=False)
print(len(train)) print(len(train))
train = train.head(30000) train = train.head(40000)
# In[3]: # In[3]:

File diff suppressed because it is too large Load Diff