commit ea55197312648d098ecc5a6ff5657a497b0fd117 Author: siulkilulki Date: Mon Apr 6 15:32:46 2020 +0200 Init master diff --git a/.gitignore b/.gitignore new file mode 100644 index 0000000..1c18d74 --- /dev/null +++ b/.gitignore @@ -0,0 +1,8 @@ + +*~ +*.swp +*.bak +*.pyc +*.o +.DS_Store +.token diff --git a/README.md b/README.md new file mode 100644 index 0000000..77bd042 --- /dev/null +++ b/README.md @@ -0,0 +1,13 @@ +Guess the date of reddits (large edition) +================================ + +Guess a reddit date based on its text. +This is a larger version with more reddits and subreddits (topics) than in . + +Output label is `FLOAT-YEAR`, a human-friendly timestamp. +`FLOAT-YEAR`=1970 + `posix_time`/(60\*60\*24\*365.25) + +Sources +------- + +Data taken from . diff --git a/config.txt b/config.txt new file mode 100644 index 0000000..ca8d11f --- /dev/null +++ b/config.txt @@ -0,0 +1 @@ +--metric MSE --precision 4 --in-header in-header.tsv --out-header out-header.tsv diff --git a/dev-0/expected.tsv.xz b/dev-0/expected.tsv.xz new file mode 100644 index 0000000..a6a78df Binary files /dev/null and b/dev-0/expected.tsv.xz differ diff --git a/dev-0/in.tsv.xz b/dev-0/in.tsv.xz new file mode 100644 index 0000000..423f4a6 Binary files /dev/null and b/dev-0/in.tsv.xz differ diff --git a/in-header.tsv b/in-header.tsv new file mode 100644 index 0000000..4a4a4b0 --- /dev/null +++ b/in-header.tsv @@ -0,0 +1 @@ +PostText diff --git a/out-header.tsv b/out-header.tsv new file mode 100644 index 0000000..0767caf --- /dev/null +++ b/out-header.tsv @@ -0,0 +1 @@ +Label diff --git a/test-A/in.tsv.xz b/test-A/in.tsv.xz new file mode 100644 index 0000000..75a5c1d Binary files /dev/null and b/test-A/in.tsv.xz differ diff --git a/train/expected.tsv.xz b/train/expected.tsv.xz new file mode 100644 index 0000000..c1e6632 Binary files /dev/null and b/train/expected.tsv.xz differ diff --git a/train/in.tsv.xz b/train/in.tsv.xz new file mode 100644 index 0000000..8c69d6f Binary files /dev/null and 
b/train/in.tsv.xz differ