Update for the new version
This commit is contained in:
parent
8acd615fdb
commit
90adf994db
19048
dev-0/out.tsv
19048
dev-0/out.tsv
File diff suppressed because it is too large
Load Diff
4
gonito.yaml
Normal file
4
gonito.yaml
Normal file
@@ -0,0 +1,4 @@
|
|||||||
|
description: tfidf with linear regression
|
||||||
|
tags:
|
||||||
|
- linear-regression
|
||||||
|
- tf-idf
|
18998
test-A/out.tsv
18998
test-A/out.tsv
File diff suppressed because it is too large
Load Diff
@@ -10,6 +10,8 @@ import random
|
|||||||
import pickle
|
import pickle
|
||||||
import sys
|
import sys
|
||||||
|
|
||||||
|
import lzma
|
||||||
|
|
||||||
def tokenizer_space(text):
|
def tokenizer_space(text):
|
||||||
return text.split(' ')
|
return text.split(' ')
|
||||||
|
|
||||||
@@ -19,9 +21,9 @@ type = sys.argv[1] # 1 or 2
|
|||||||
def run():
|
def run():
|
||||||
|
|
||||||
# LOADING DATA
|
# LOADING DATA
|
||||||
train_text = [a.rstrip('\n') for a in open('../train/in.tsv','r')]
|
train_text = [a.rstrip('\n') for a in lzma.open('../train/in.tsv.xz', 'rt')]
|
||||||
dev_text = [a.rstrip('\n') for a in open('../dev-0/in.tsv','r')]
|
dev_text = [a.rstrip('\n') for a in lzma.open('../dev-0/in.tsv.xz', 'rt')]
|
||||||
test_text = [a.rstrip('\n') for a in open('../test-A/in.tsv','r')]
|
test_text = [a.rstrip('\n') for a in lzma.open('../test-A/in.tsv.xz', 'rt')]
|
||||||
global lowest
|
global lowest
|
||||||
|
|
||||||
train_year = [float(a.rstrip('\n')) for a in open(f'../train/expected{type}.tsv','r')]
|
train_year = [float(a.rstrip('\n')) for a in open(f'../train/expected{type}.tsv','r')]
|
||||||
|
Loading…
Reference in New Issue
Block a user