add MAP metric

2017-12-12 07:54:21 +01:00 · 2017-12-12 07:54:21 +01:00 · 9643719193
commit 9643719193
parent 7eef53832d
8 changed files with 80 additions and 4 deletions
--- a/src/GEval/Core.hs
+++ b/src/GEval/Core.hs
@ -58,6 +58,7 @@ defaultLogLossHashedSize :: Word32
 defaultLogLossHashedSize = 10

 data Metric = RMSE | MSE | BLEU | Accuracy | ClippEU | FMeasure Double | NMI | LogLossHashed Word32 | CharMatch
+              | MAP
              deriving (Eq)

 instance Show Metric where
@ -75,6 +76,7 @@ instance Show Metric where
                                                      else
                                                       (show nbOfBits))
  show CharMatch = "CharMatch"
+  show MAP = "MAP"

 instance Read Metric where
  readsPrec _ ('R':'M':'S':'E':theRest) = [(RMSE, theRest)]
@ -90,6 +92,7 @@ instance Read Metric where
    [(nbOfBits, theRest)] -> [(LogLossHashed nbOfBits, theRest)]
    _ -> [(LogLossHashed defaultLogLossHashedSize, theRest)]
  readsPrec p ('C':'h':'a':'r':'M':'a':'t':'c':'h':theRest) = [(CharMatch, theRest)]
+  readsPrec _ ('M':'A':'P':theRest) = [(MAP, theRest)]

 data MetricOrdering = TheLowerTheBetter | TheHigherTheBetter

@ -103,6 +106,7 @@ getMetricOrdering (FMeasure _) = TheHigherTheBetter
 getMetricOrdering NMI = TheHigherTheBetter
 getMetricOrdering (LogLossHashed _) = TheLowerTheBetter
 getMetricOrdering CharMatch = TheHigherTheBetter
+getMetricOrdering MAP = TheHigherTheBetter

 defaultOutDirectory = "."
 defaultTestName = "test-A"
@ -262,6 +266,12 @@ gevalCore' ClippEU _ = gevalCoreWithoutInput parseClippingSpecs parseClippings m

 gevalCore' NMI _ = gevalCoreWithoutInput id id id (CC.foldl updateConfusionMatrix M.empty) normalizedMutualInformationFromConfusionMatrix

+gevalCore' MAP _ = gevalCoreWithoutInput (DLS.splitOn "\t" . unpack)
+                                         (DLS.splitOn "\t" . unpack)
+                                         (\(e,g) -> calculateMAPForOneResult e g)
+                                         averageC
+                                         id
+
 gevalCore' (LogLossHashed nbOfBits) _ = helper nbOfBits
  -- for LogLossHashed we "salt" each hash with the line number
  where helper nbOfBits expectedFilePath outFilePath =
--- a/src/GEval/CreateChallenge.hs
+++ b/src/GEval/CreateChallenge.hs
@ -142,6 +142,24 @@ Directory structure
 * `${testName}/expected.tsv` — American reference text for the test set
 |]

+readmeMDContents MAP testName = [i|
+English word for a Polish word
+================================================
+
+Give a (British or American) English equivalent of a Polish word.
+
+This is a sample challenge for MAP evaluation metric. MAP (Mean Average Precision)
+is used, mostly in information retrieval, for evaluation of ranked retrieval results.
+
+The relevant items are separated by TABs (could be just one item) and returned items
+should be separated by TABs.
+
+See Christopher D. Manning, Prabhakar Raghavan and Hinrich Schütze,
+"Introduction to Information Retrieval", Cambridge University Press, 2008 for
+more discussion of the metric.
+|] ++ (commonReadmeMDContents testName)
+
+
 readmeMDContents _ testName = [i|
 GEval sample challenge
 ======================
@ -209,7 +227,6 @@ trainContents NMI = [hereLit|pl	Kto pod kim dołki kopie, ten sam w nie wpada.
 en	The pen is mightier than the sword.
 pl	Baba z wozu, koniom lżej.
 |]
-
 trainContents (LogLossHashed _) = [hereLit|Ala ma psa i kota
 Basia ma psa
 Nie kupujemy kota w worku
@ -220,6 +237,11 @@ Camptown race-track five miles long, Oh, doo-dah day!
 I come down dah wid my hat caved in, Doo-dah! doo-dah!
 I go back home wid a pocket full of tin, Oh, doo-dah day!
 |]
+trainContents MAP = [hereLit|honor	US	honor
+honour	GB	honor
+titbit	GB	smakołyk
+tidbit	US	smakołyk
+|]
 trainContents _ = [hereLit|0.06	0.39	0	0.206
 1.00	1.00	1	0.017
 317.8	5.20	67	0.048
@ -247,6 +269,10 @@ devInContents CharMatch = [hereLit|honour to organise
 nothing to change
 time traveller
 |]
+devInContents MAP = [hereLit|US	noc
+GB	wózek dziecięcy
+GB	wizualizować
+|]
 devInContents _ = [hereLit|0.72	0	0.007
 9.54	62	0.054
 |]
@ -272,6 +298,10 @@ devExpectedContents CharMatch = [hereLit|honor to organize
 nothing to change
 time traveler
 |]
+devExpectedContents MAP = [hereLit|night	nite
+pram
+visualise
+|]
 devExpectedContents _ = [hereLit|0.82
 95.2
 |]
@ -299,6 +329,10 @@ testInContents CharMatch = [hereLit|paralysed by practise
 recognise
 nothing
 |]
+testInContents MAP = [hereLit|US	wózek dziecięcy
+GB	słoń
+US	słoń
+|]
 testInContents _ = [hereLit|1.52	2	0.093
 30.06	14	0.009
 |]
@ -326,6 +360,10 @@ testExpectedContents CharMatch = [hereLit|paralyzed by practice
 recognize
 nothing
 |]
+testExpectedContents MAP = [hereLit|trolley
+elephant
+elephant
+|]
 testExpectedContents _ = [hereLit|0.11
 17.2
 |]
--- a/src/GEval/OptionsParser.hs
+++ b/src/GEval/OptionsParser.hs
@ -82,7 +82,7 @@ metricReader = option auto
                 <> value defaultMetric
                 <> showDefault
                 <> metavar "METRIC"
-                 <> help "Metric to be used - RMSE, MSE, Accuracy, F-measure (specify as F1, F2, F0.25, etc.), BLEU, NMI, ClippEU, LogLossHashed or CharMatch" )
+                 <> help "Metric to be used - RMSE, MSE, Accuracy, F-measure (specify as F1, F2, F0.25, etc.), MAP, BLEU, NMI, ClippEU, LogLossHashed or CharMatch" )

 runGEval :: [String] -> IO (Either (ParserResult GEvalOptions) (Maybe MetricValue))
 runGEval args = do
--- a/src/GEval/PrecisionRecall.hs
+++ b/src/GEval/PrecisionRecall.hs
@ -1,6 +1,7 @@
 {-# LANGUAGE PartialTypeSignatures #-}

-module GEval.PrecisionRecall(fMeasure, f1Measure, f2Measure, precision, recall,
+module GEval.PrecisionRecall(calculateMAPForOneResult,
+                             fMeasure, f1Measure, f2Measure, precision, recall,
                             fMeasureOnCounts, f1MeasureOnCounts, f2MeasureOnCounts, countFolder,
                             precisionAndRecall, precisionAndRecallFromCounts, maxMatch)
       where
@ -10,6 +11,18 @@ import GEval.Common
 import Data.Graph.Inductive
 import Data.Graph.Inductive.Query.MaxFlow

+import Data.List (nub, foldl')
+
+calculateMAPForOneResult :: (Eq a) => [a] -> [a] -> Double
+calculateMAPForOneResult expected got = precisionSum / fromIntegral (length expected)
+  where (_, _, precisionSum) = calculateMAPForOneResultCore expected (nub got)
+        calculateMAPForOneResultCore expected got = foldl' (oneMAPStep expected) (0, 0, 0.0) got
+        oneMAPStep expected (gotCount, allCount, precisionSum) gotItem
+          | gotItem `elem` expected = (newGotCount, newAllCount, precisionSum + (newGotCount /. newAllCount))
+          | otherwise = (gotCount, newAllCount, precisionSum)
+         where newGotCount = gotCount + 1
+               newAllCount = allCount + 1
+
 f2Measure :: (a -> b -> Bool) -> [a] -> [b] -> Double
 f2Measure = fMeasure 2.0

--- a/test/Spec.hs
+++ b/test/Spec.hs
@ -166,7 +166,15 @@ main = hspec $ do
      runGEvalTest "charmatch-complex" `shouldReturnAlmost` 0.1923076923076923
    it "broken test without input" $ do
      runGEvalTest "charmatch-no-input" `shouldThrow` (== NoInputFile "test/charmatch-no-input/charmatch-no-input/test-A/in.tsv")
-
+  describe "MAP" $ do
+    it "one result" $ do
+      (calculateMAPForOneResult ["Berlin", "London", "Warsaw"]
+                                ["Warsaw", "Moscow", "Berlin", "Prague"]) `shouldBeAlmost` 0.55555555
+    it "check whether you cannot cheat with duplicated results" $ do
+      (calculateMAPForOneResult ["one", "two"]
+                                ["one", "one"]) `shouldBeAlmost` 0.5
+    it "simple test" $ do
+      runGEvalTest "map-simple" `shouldReturnAlmost` 0.444444444

 neverMatch :: Char -> Int -> Bool
 neverMatch _ _ = False
--- a/test/map-simple/map-simple-solution/test-A/out.tsv
+++ b/test/map-simple/map-simple-solution/test-A/out.tsv
@ -0,0 +1,3 @@
+pink	blue
+red	yellow	rose	black
+white	gray
--- a/test/map-simple/map-simple/config.txt
+++ b/test/map-simple/map-simple/config.txt
@ -0,0 +1 @@
+--metric MAP
--- a/test/map-simple/map-simple/test-A/expected.tsv
+++ b/test/map-simple/map-simple/test-A/expected.tsv
@ -0,0 +1,3 @@
+blue
+red	rose
+green