diff --git a/dev-0/out.tsv b/dev-0/out.tsv new file mode 100644 index 0000000..c8b523e --- /dev/null +++ b/dev-0/out.tsv @@ -0,0 +1,87 @@ +[38 +43 + 5 +59 +73 +74 +57 +23 +76 + 8 +48 +24 +62 + 4 +10 +47 +27 +51 + 3 +61 +39 +35 +16 +17 + 34 + 1 +13 +16 + 9 +53 +71 +50 +63 +45 +28 +12 +37 +52 +13 +31 + 6 +29 +65 +56 +36 +22 +54 +49 + 70 +58 + 0 + 5 + 7 +42 +19 +17 +15 +20 +21 +33 +12 +32 +66 +44 +60 +30 +41 +46 +40 +11 +68 + 3 + 25 + 2 +55 +23 +64 +19 +14 +72 + 8 +69 + 8 +18 +75 +26 +67] \ No newline at end of file diff --git a/geval b/geval new file mode 100755 index 0000000..b68b316 Binary files /dev/null and b/geval differ diff --git a/prog.py b/prog.py index 0a10276..3843b76 100644 --- a/prog.py +++ b/prog.py @@ -3,11 +3,14 @@ import numpy as np import sklearn.metrics from sklearn.cluster import KMeans -with open("dev-0/in.tsv") as f: +with open("test-A/in.tsv") as f: content = f.readlines() vectorizer = TfidfVectorizer(ngram_range=(1,2), use_idf = False) vectorizer = TfidfVectorizer() document_vectors = vectorizer.fit_transform(content) - kmeans = KMeans(n_clusters=4, random_state=0).fit(document_vectors) + kmeans = KMeans(n_clusters=77, random_state=0).fit(document_vectors) pred_y = kmeans.fit_predict(document_vectors) - print(pred_y) + t=kmeans.labels_ + t=np.array2string(t, precision=2, separator='\n',suppress_small=True) + f = open("test-A/out.tsv", "a") + f.write(t) diff --git a/test-A/out.tsv b/test-A/out.tsv new file mode 100644 index 0000000..214a99c --- /dev/null +++ b/test-A/out.tsv @@ -0,0 +1,691 @@ +[ 1 + 5 +14 +50 +62 +64 +50 +40 +53 + 5 +41 +36 +76 +58 +39 +33 +12 +71 +12 +39 + 3 +67 +21 +52 + 68 +53 +68 +57 +40 +68 + 1 +76 +64 +33 +54 +63 +36 +33 +14 +76 +43 +50 +13 +19 +25 +58 +33 +20 + 14 +39 +14 +50 +33 +52 +17 +15 +33 +14 +44 +28 +73 +10 +68 +62 +39 + 7 +52 +64 +16 +53 + 3 +45 + 12 +33 +33 +33 +53 +37 +46 +53 +34 + 4 +42 +63 +62 +49 +33 +37 +65 +43 +61 + 3 +54 +62 +10 +13 + 1 +25 +34 +30 +37 +23 +12 +24 + 9 +70 +48 +53 +71 +16 + 2 +14 +74 +14 +60 +62 +65 +31 +48 +70 + 28 +40 +24 +70 +33 +14 +12 +15 +32 +33 +17 +54 +33 +15 +51 +54 +47 +53 +42 + 8 +69 +34 +28 + 8 + 48 +33 +16 + 8 +73 +15 +12 +13 +65 +29 +52 +36 +75 +38 + 9 +23 +66 + 1 +33 +20 +17 +62 +42 +30 + 45 + 0 +63 +21 +37 +50 +10 +42 +72 +41 +33 +31 +59 +28 +21 +51 +27 +33 +40 +18 +40 +17 + 1 +48 + 36 +70 + 1 +38 +33 +14 +33 + 1 +53 +27 + 1 +70 +12 +10 +14 +20 +65 + 1 +40 +21 + 5 +16 +20 +36 + 40 +21 +44 +74 +39 +33 + 3 +34 +18 +54 +66 +71 +42 +36 +33 +57 +15 +20 +64 +37 + 0 +52 +27 +33 + 50 +74 + 7 +57 +37 +44 + 3 + 3 +57 +20 + 6 +31 + 4 +26 +27 +18 + 2 +33 +30 +28 +15 +40 +13 +53 + 47 +29 +70 +16 +27 +39 +13 +33 +17 +28 +21 +13 +58 + 2 +28 + 9 +19 + 3 +60 +53 +26 +35 +28 +14 + 12 +11 +71 +70 +48 +53 + 1 + 3 +10 +35 +13 +57 +13 +71 +16 +17 +33 +41 +21 +16 + 5 +31 +65 +17 + 9 +76 +42 +17 +17 + 6 +20 +33 +46 +42 +67 + 5 + 6 +46 + 5 +60 +48 +58 +33 +71 +73 +15 +33 +14 + 37 + 9 +39 +39 + 5 +33 +26 +29 +52 +28 +17 +49 + 5 +33 +48 + 6 +17 +40 +75 +71 + 3 +53 +24 +10 + 40 +21 +48 +39 + 3 +53 +14 +76 +20 +66 +65 +33 +36 +57 +40 +17 +15 +10 +22 +56 +39 +53 +50 +25 + 1 + 2 +25 +36 +69 +64 + 1 + 7 +68 +14 +39 +63 + 1 +62 +75 +33 +58 +33 +15 + 2 +22 +29 +56 + 2 + 73 +19 +43 +35 +40 + 6 +15 +17 +20 +17 + 8 +75 +38 +73 +21 +21 +30 +27 +14 +62 +34 +29 +54 +52 + 20 +50 +59 +73 +50 +40 +52 +21 +44 +14 +46 +38 +12 +31 + 9 +59 +23 +58 +53 +50 +17 +57 +55 +21 + 53 +20 +43 + 3 +48 +70 +50 +16 +76 +10 +14 +33 +69 +43 +46 +30 +43 +30 +62 +58 +27 +21 +13 +44 + 66 +18 +46 +53 +48 +51 +33 + 3 +27 + 5 +69 +14 +20 + 3 +32 +71 +26 + 8 +62 +28 +25 +14 +16 +21 + 30 + 9 +23 + 9 + 2 +25 +64 +61 +21 +63 +27 +49 +31 +12 +63 +20 +19 +53 +66 +71 +65 +30 +21 +42 + 16 +76 +59 +71 +43 +14 +48 +67 +34 +29 +17 +70 +14 + 8 +62 +55 +21 +64 +33 +76 +53 +26 + 9 +43 + 27 +57 +54 + 4 + 1 + 1 +45 + 7 +64 +14 +60 +40 +53 +53 +15 +30 + 1 +54 +14 +14 +17 +63 + 9 +49 + 2 +24 +49 +16 +15 +28 +71 +64 +27 +71 + 4 +15 +28 + 3 +31 +60 +74 +21 +23 +63 + 1 +73 +73 +69 + 14 +39 +17 +29 +15 +60 +33 + 5 +55 +58 +36 +76 + 1 +24 +36 +21 +28 +20 + 5 +65 +51 +67 +17 +14 + 16 +18 +34 +53 +12 +34 +49 +20 +54 +17 +27 +53 +42 +52 +44 + 6 +39 + 1 +28 +15 +40 +30 +21 +22 + 57 +63 +17 +51 + 4 +49 +74 +33 +13 +27 +49 +22 +60 +21 +71 +17 +29 +76 +44 +50 +75 + 6 +23 +12 + 17 +66 + 1 +42 +33 + 1 +48 +21 +44 +54 +53 +30 + 2 +14 +39 +24 + 1 +43 +66] \ No newline at end of file