forked from kubapok/retroc2
ver 2 10000 train
This commit is contained in:
parent
a2d5d926d0
commit
9dfe8fe3b5
@ -2399,7 +2399,7 @@
|
|||||||
1882.9509376976243
|
1882.9509376976243
|
||||||
2006.2831425999086
|
2006.2831425999086
|
||||||
1901.8236927643368
|
1901.8236927643368
|
||||||
1845.8431605627075
|
1846.2982848835586
|
||||||
1907.4807609148313
|
1907.4807609148313
|
||||||
1919.1770226218323
|
1919.1770226218323
|
||||||
1808.6714849322975
|
1808.6714849322975
|
||||||
@ -4770,7 +4770,7 @@
|
|||||||
1869.227930644483
|
1869.227930644483
|
||||||
1906.3844663610223
|
1906.3844663610223
|
||||||
1945.3424395378358
|
1945.3424395378358
|
||||||
1897.9459278201575
|
1897.8191028561196
|
||||||
1902.4248382081591
|
1902.4248382081591
|
||||||
1916.941205362806
|
1916.941205362806
|
||||||
1951.3650770196946
|
1951.3650770196946
|
||||||
@ -6336,7 +6336,8 @@
|
|||||||
1974.3692055493452
|
1974.3692055493452
|
||||||
1851.1544441272165
|
1851.1544441272165
|
||||||
1837.2440449549101
|
1837.2440449549101
|
||||||
1921.004623698161
|
1906.469703262039
|
||||||
|
1941.217890583569
|
||||||
1863.050896361201
|
1863.050896361201
|
||||||
1935.4381446070022
|
1935.4381446070022
|
||||||
1838.6591222095797
|
1838.6591222095797
|
||||||
@ -11780,7 +11781,7 @@
|
|||||||
1971.261305356721
|
1971.261305356721
|
||||||
1965.7895878732024
|
1965.7895878732024
|
||||||
1894.1926433945762
|
1894.1926433945762
|
||||||
1843.5769117112493
|
1843.4054815753093
|
||||||
1798.5510049748643
|
1798.5510049748643
|
||||||
1874.6762363908592
|
1874.6762363908592
|
||||||
1933.9946144817523
|
1933.9946144817523
|
||||||
@ -11868,7 +11869,7 @@
|
|||||||
1933.1659502110472
|
1933.1659502110472
|
||||||
1948.6097367533557
|
1948.6097367533557
|
||||||
1892.0990307008867
|
1892.0990307008867
|
||||||
1881.7539718505154
|
1882.4301864075958
|
||||||
1898.8163564591582
|
1898.8163564591582
|
||||||
1891.7720648916354
|
1891.7720648916354
|
||||||
1899.1896641539054
|
1899.1896641539054
|
||||||
@ -13607,7 +13608,8 @@
|
|||||||
1899.4677481479275
|
1899.4677481479275
|
||||||
1832.0157188177106
|
1832.0157188177106
|
||||||
1830.994476738317
|
1830.994476738317
|
||||||
1859.8255318357274
|
1872.857763141983
|
||||||
|
1887.1141759579975
|
||||||
1821.8836244133079
|
1821.8836244133079
|
||||||
1913.4663037228643
|
1913.4663037228643
|
||||||
1985.0371631137966
|
1985.0371631137966
|
||||||
@ -14150,7 +14152,7 @@
|
|||||||
1958.9030832469919
|
1958.9030832469919
|
||||||
1917.5848215968706
|
1917.5848215968706
|
||||||
1905.0147395763986
|
1905.0147395763986
|
||||||
1871.6714142048124
|
1871.3321978094336
|
||||||
1901.0391754660595
|
1901.0391754660595
|
||||||
1871.966900926708
|
1871.966900926708
|
||||||
1965.8106578756367
|
1965.8106578756367
|
||||||
@ -17368,7 +17370,7 @@
|
|||||||
1863.7139407495256
|
1863.7139407495256
|
||||||
1980.5486905106713
|
1980.5486905106713
|
||||||
1820.0882670928129
|
1820.0882670928129
|
||||||
1856.3160414564259
|
1855.6257391640597
|
||||||
1921.6397748707468
|
1921.6397748707468
|
||||||
1970.804687384616
|
1970.804687384616
|
||||||
1902.8181073379312
|
1902.8181073379312
|
||||||
@ -19795,7 +19797,7 @@
|
|||||||
1917.3208523541055
|
1917.3208523541055
|
||||||
1850.9065744029447
|
1850.9065744029447
|
||||||
1912.2333094584328
|
1912.2333094584328
|
||||||
1837.7607134713
|
1837.590902324513
|
||||||
1969.993000236959
|
1969.993000236959
|
||||||
1956.0008619219907
|
1956.0008619219907
|
||||||
1941.4140218594555
|
1941.4140218594555
|
||||||
|
|
8
main.py
8
main.py
@ -1,3 +1,4 @@
|
|||||||
|
import csv
|
||||||
import pandas as pd
|
import pandas as pd
|
||||||
from sklearn.linear_model import LinearRegression
|
from sklearn.linear_model import LinearRegression
|
||||||
from sklearn.pipeline import make_pipeline
|
from sklearn.pipeline import make_pipeline
|
||||||
@ -6,8 +7,8 @@ from sklearn.feature_extraction.text import TfidfVectorizer
|
|||||||
col_names = ['start_date', 'end_date', 'title', 'source', 'content']
|
col_names = ['start_date', 'end_date', 'title', 'source', 'content']
|
||||||
|
|
||||||
train_set = pd.read_table('train/train.tsv.xz', error_bad_lines=False, header=None, names=col_names)
|
train_set = pd.read_table('train/train.tsv.xz', error_bad_lines=False, header=None, names=col_names)
|
||||||
dev_set = pd.read_table('dev-0/in.tsv', error_bad_lines=False, header=None, names=col_names[4:])
|
dev_set = pd.read_table('dev-0/in.tsv', error_bad_lines=False, header=None, names=col_names[4:], quoting=csv.QUOTE_NONE,)
|
||||||
test_set = pd.read_table('test-A/in.tsv', error_bad_lines=False, header=None, names=col_names[4:])
|
test_set = pd.read_table('test-A/in.tsv', error_bad_lines=False, header=None, names=col_names[4:], quoting=csv.QUOTE_NONE,)
|
||||||
|
|
||||||
train_set = train_set.head(10000)
|
train_set = train_set.head(10000)
|
||||||
|
|
||||||
@ -17,6 +18,9 @@ y_train = (train_set['start_date'] + train_set['end_date']) / 2
|
|||||||
X_dev = dev_set['content']
|
X_dev = dev_set['content']
|
||||||
X_test = test_set['content']
|
X_test = test_set['content']
|
||||||
|
|
||||||
|
print(dev_set)
|
||||||
|
print(test_set)
|
||||||
|
|
||||||
print('Trenowanie modelu...')
|
print('Trenowanie modelu...')
|
||||||
model = make_pipeline(TfidfVectorizer(), LinearRegression())
|
model = make_pipeline(TfidfVectorizer(), LinearRegression())
|
||||||
model.fit(X_train, y_train)
|
model.fit(X_train, y_train)
|
||||||
|
@ -206,7 +206,7 @@
|
|||||||
1928.6587695672113
|
1928.6587695672113
|
||||||
1990.9156424576067
|
1990.9156424576067
|
||||||
1881.4836785253315
|
1881.4836785253315
|
||||||
1884.4519979671402
|
1884.046089520049
|
||||||
1877.4040287725156
|
1877.4040287725156
|
||||||
1911.8947608148899
|
1911.8947608148899
|
||||||
1899.7628344836432
|
1899.7628344836432
|
||||||
@ -961,7 +961,7 @@
|
|||||||
1920.806099260425
|
1920.806099260425
|
||||||
1934.7567428867874
|
1934.7567428867874
|
||||||
2000.6897694955856
|
2000.6897694955856
|
||||||
1914.538168494774
|
1915.0424831770722
|
||||||
1961.5348637593509
|
1961.5348637593509
|
||||||
1976.0306055365545
|
1976.0306055365545
|
||||||
1990.438972379044
|
1990.438972379044
|
||||||
@ -1458,7 +1458,7 @@
|
|||||||
1897.0381253809762
|
1897.0381253809762
|
||||||
1898.2169614742145
|
1898.2169614742145
|
||||||
1907.1817765399285
|
1907.1817765399285
|
||||||
1899.7781849186872
|
1900.5051189207925
|
||||||
1916.2254375826196
|
1916.2254375826196
|
||||||
1887.7589605584237
|
1887.7589605584237
|
||||||
1900.9036082026578
|
1900.9036082026578
|
||||||
@ -1944,7 +1944,7 @@
|
|||||||
1932.4369032498905
|
1932.4369032498905
|
||||||
1924.7608021483702
|
1924.7608021483702
|
||||||
1932.6665753305242
|
1932.6665753305242
|
||||||
1910.2637014903585
|
1911.1136741658142
|
||||||
1844.3306216770322
|
1844.3306216770322
|
||||||
1920.9735284228261
|
1920.9735284228261
|
||||||
1898.4191575441814
|
1898.4191575441814
|
||||||
@ -3448,7 +3448,8 @@
|
|||||||
1985.828576031535
|
1985.828576031535
|
||||||
1929.0980372984723
|
1929.0980372984723
|
||||||
1963.416770426545
|
1963.416770426545
|
||||||
1983.403262556507
|
1958.0061961875651
|
||||||
|
1979.5713424319551
|
||||||
1927.054394299714
|
1927.054394299714
|
||||||
1887.5844594202247
|
1887.5844594202247
|
||||||
1952.952473384423
|
1952.952473384423
|
||||||
@ -5241,7 +5242,7 @@
|
|||||||
1961.7395028010487
|
1961.7395028010487
|
||||||
1911.578177275467
|
1911.578177275467
|
||||||
1993.361626034721
|
1993.361626034721
|
||||||
1860.938964267848
|
1861.582235755756
|
||||||
1880.8873010116863
|
1880.8873010116863
|
||||||
1891.0584427244678
|
1891.0584427244678
|
||||||
1927.9286642737504
|
1927.9286642737504
|
||||||
@ -6326,7 +6327,7 @@
|
|||||||
1894.4410835153267
|
1894.4410835153267
|
||||||
1961.8656695163497
|
1961.8656695163497
|
||||||
1918.6540411919113
|
1918.6540411919113
|
||||||
1902.5162709462134
|
1901.772008274914
|
||||||
1970.120121368801
|
1970.120121368801
|
||||||
1958.8069602196501
|
1958.8069602196501
|
||||||
1822.1082097880283
|
1822.1082097880283
|
||||||
@ -8450,7 +8451,7 @@
|
|||||||
1937.635613281464
|
1937.635613281464
|
||||||
1931.6145334405564
|
1931.6145334405564
|
||||||
1911.15006803172
|
1911.15006803172
|
||||||
1937.8085829935567
|
1937.807751149183
|
||||||
1911.5828102456112
|
1911.5828102456112
|
||||||
1923.676307918832
|
1923.676307918832
|
||||||
1934.4279819781618
|
1934.4279819781618
|
||||||
@ -10178,7 +10179,7 @@
|
|||||||
1923.6971313843694
|
1923.6971313843694
|
||||||
1914.7503506572486
|
1914.7503506572486
|
||||||
1958.747533690674
|
1958.747533690674
|
||||||
1917.7393715934418
|
1918.0059649038217
|
||||||
1909.3267326347955
|
1909.3267326347955
|
||||||
1982.6082963993645
|
1982.6082963993645
|
||||||
1963.8563866041861
|
1963.8563866041861
|
||||||
@ -11287,7 +11288,7 @@
|
|||||||
1930.5405282461093
|
1930.5405282461093
|
||||||
1855.5220302615335
|
1855.5220302615335
|
||||||
1952.8298961854482
|
1952.8298961854482
|
||||||
1893.2863705412592
|
1892.6402597321664
|
||||||
1928.501989244598
|
1928.501989244598
|
||||||
1967.1929378220514
|
1967.1929378220514
|
||||||
1911.8069275316302
|
1911.8069275316302
|
||||||
@ -13417,7 +13418,7 @@
|
|||||||
2002.918285090558
|
2002.918285090558
|
||||||
1907.5419986831682
|
1907.5419986831682
|
||||||
1982.5755707544743
|
1982.5755707544743
|
||||||
1844.5958529536363
|
1844.823717363196
|
||||||
1940.7293100159388
|
1940.7293100159388
|
||||||
1939.6370593406318
|
1939.6370593406318
|
||||||
1910.3139645164986
|
1910.3139645164986
|
||||||
|
|
Loading…
Reference in New Issue
Block a user