Update for the new version
This commit is contained in:
parent
8acd615fdb
commit
90adf994db
19048
dev-0/out.tsv
19048
dev-0/out.tsv
File diff suppressed because it is too large
Load Diff
4
gonito.yaml
Normal file
4
gonito.yaml
Normal file
@ -0,0 +1,4 @@
|
||||
description: tfidf with linear regression
|
||||
tags:
|
||||
- linear-regression
|
||||
- tf-idf
|
18998
test-A/out.tsv
18998
test-A/out.tsv
File diff suppressed because it is too large
Load Diff
@ -10,18 +10,20 @@ import random
|
||||
import pickle
|
||||
import sys
|
||||
|
||||
import lzma
|
||||
|
||||
def tokenizer_space(text):
|
||||
return text.split(' ')
|
||||
|
||||
type = sys.argv[1] # 1 or 2
|
||||
type = sys.argv[1] # 1 or 2
|
||||
|
||||
|
||||
def run():
|
||||
|
||||
# LOADING DATA
|
||||
train_text = [a.rstrip('\n') for a in open('../train/in.tsv','r')]
|
||||
dev_text = [a.rstrip('\n') for a in open('../dev-0/in.tsv','r')]
|
||||
test_text = [a.rstrip('\n') for a in open('../test-A/in.tsv','r')]
|
||||
train_text = [a.rstrip('\n') for a in lzma.open('../train/in.tsv.xz', 'rt')]
|
||||
dev_text = [a.rstrip('\n') for a in lzma.open('../dev-0/in.tsv.xz', 'rt')]
|
||||
test_text = [a.rstrip('\n') for a in lzma.open('../test-A/in.tsv.xz', 'rt')]
|
||||
global lowest
|
||||
|
||||
train_year = [float(a.rstrip('\n')) for a in open(f'../train/expected{type}.tsv','r')]
|
||||
|
Loading…
Reference in New Issue
Block a user