Improve detecting wrong metrics during validation

This commit is contained in:
Filip Gralinski 2021-07-29 14:55:59 +02:00
parent 905705bfd5
commit 8dbcb548ae
14 changed files with 82 additions and 12 deletions

View File

@ -136,6 +136,7 @@ data GEvalException = NoExpectedFile FilePath
| OtherException String | OtherException String
| NoHeaderFile FilePath | NoHeaderFile FilePath
| UnknownMetric String | UnknownMetric String
| UnknownFlags String
deriving (Eq) deriving (Eq)
instance Exception GEvalException instance Exception GEvalException
@ -159,6 +160,7 @@ instance Show GEvalException where
show (OtherException message) = message show (OtherException message) = message
show (NoHeaderFile filePath) = somethingWrongWithFilesMessage "No file with header specification" filePath show (NoHeaderFile filePath) = somethingWrongWithFilesMessage "No file with header specification" filePath
show (UnknownMetric t) = "Unknown or broken metric definition: " ++ t show (UnknownMetric t) = "Unknown or broken metric definition: " ++ t
show (UnknownFlags t) = "Unknown or broken metric flags: " ++ t
somethingWrongWithFilesMessage :: String -> FilePath -> String somethingWrongWithFilesMessage :: String -> FilePath -> String
somethingWrongWithFilesMessage msg filePath = Prelude.concat somethingWrongWithFilesMessage msg filePath = Prelude.concat

View File

@ -9,15 +9,16 @@ module GEval.EvaluationScheme
where where
import GEval.Metric import GEval.Metric
import GEval.Common
import Debug.Trace import Control.Exception
import Text.Regex.PCRE.Heavy import Text.Regex.PCRE.Heavy
import Text.Regex.PCRE.Light.Base (Regex(..)) import Text.Regex.PCRE.Light.Base (Regex(..))
import Text.Regex.PCRE.Light (compile) import Text.Regex.PCRE.Light (compile)
import Data.Text (Text(..), concat, toCaseFold, toLower, toUpper, pack, unpack, words, unwords) import Data.Text (Text, concat, toCaseFold, toLower, toUpper, pack, unpack, words, unwords)
import Data.List (intercalate, break, sort) import Data.List (intercalate, break, sort)
import Data.Either import Data.Char (isLetter)
import Data.Maybe (fromMaybe, catMaybes) import Data.Maybe (fromMaybe, catMaybes)
import qualified Data.ByteString.UTF8 as BSU import qualified Data.ByteString.UTF8 as BSU
@ -66,13 +67,17 @@ readOps ('N':theRest) = handleParametrizedOp (SetName . pack) theRest
readOps ('P':theRest) = handleParametrizedOp (SetPriority . read) theRest readOps ('P':theRest) = handleParametrizedOp (SetPriority . read) theRest
readOps ('s':theRest) = handleParametrizedBinaryOp (\a b -> RegexpSubstition (compile (BSU.fromString a) []) (pack b)) theRest readOps ('s':theRest) = handleParametrizedBinaryOp (\a b -> RegexpSubstition (compile (BSU.fromString a) []) (pack b)) theRest
readOps ('f':theRest) = handleParametrizedOp (FeatureFilter . pack) theRest readOps ('f':theRest) = handleParametrizedOp (FeatureFilter . pack) theRest
readOps s = ([], s) -- this is not the right way to do this, but try catch at least unknown flags
readOps t@(c:_) = if isLetter c
then throw $ UnknownFlags t
else ([], t)
readOps "" = ([], "")
getRegexpMatch :: EvaluationScheme -> Maybe Regex getRegexpMatch :: EvaluationScheme -> Maybe Regex
getRegexpMatch (EvaluationScheme _ ops) = getRegexpMatch' ops getRegexpMatch (EvaluationScheme _ ops) = getRegexpMatch' ops
where getRegexpMatch' [] = Nothing where getRegexpMatch' [] = Nothing
getRegexpMatch' ((RegexpMatch regex):_) = Just regex getRegexpMatch' ((RegexpMatch regex):_) = Just regex
getRegexpMatch' (_:ops) = getRegexpMatch' ops getRegexpMatch' (_:ops') = getRegexpMatch' ops'
handleParametrizedOp :: (String -> PreprocessingOperation) -> String -> ([PreprocessingOperation], String) handleParametrizedOp :: (String -> PreprocessingOperation) -> String -> ([PreprocessingOperation], String)
handleParametrizedOp constructor theRest = handleParametrizedOp constructor theRest =
@ -92,11 +97,13 @@ handleParametrizedBinaryOp constructor theRest =
in ((constructor paramA paramB):ops, theRest''') in ((constructor paramA paramB):ops, theRest''')
parseParameter :: String -> (Maybe String, String) parseParameter :: String -> (Maybe String, String)
parseParameter (leftParameterBracket:theRest) = parseParameter [] = (Nothing, [])
case break (== rightParameterBracket) theRest of parseParameter t@(fChar:theRest) =
(s, []) -> (Nothing, s) if fChar == leftParameterBracket
(param, (_:theRest')) -> (Just param, theRest') then case break (== rightParameterBracket) theRest of
parseParameter s = (Nothing, s) (s, []) -> throw $ UnknownFlags t
(param, (_:theRest')) -> (Just param, theRest')
else throw $ UnknownFlags t
instance Show EvaluationScheme where instance Show EvaluationScheme where
@ -105,9 +112,10 @@ instance Show EvaluationScheme where
else ":" ++ (Prelude.concat (map show operations))) else ":" ++ (Prelude.concat (map show operations)))
evaluationSchemeName :: EvaluationScheme -> String evaluationSchemeName :: EvaluationScheme -> String
evaluationSchemeName scheme@(EvaluationScheme metric operations) = fromMaybe (show scheme) (findNameSet operations) evaluationSchemeName scheme@(EvaluationScheme _ operations) = fromMaybe (show scheme) (findNameSet operations)
evaluationSchemePriority scheme@(EvaluationScheme _ operations) = fromMaybe defaultPriority (findPrioritySet operations) evaluationSchemePriority :: EvaluationScheme -> Int
evaluationSchemePriority (EvaluationScheme _ operations) = fromMaybe defaultPriority (findPrioritySet operations)
where defaultPriority = 1 where defaultPriority = 1
findNameSet :: [PreprocessingOperation] -> Maybe String findNameSet :: [PreprocessingOperation] -> Maybe String

View File

@ -700,6 +700,10 @@ main = hspec $ do
gesFormatting = FormattingOptions (Just 4) False } gesFormatting = FormattingOptions (Just 4) False }
createChallenge True tempDir spec createChallenge True tempDir spec
validationChallenge tempDir spec validationChallenge tempDir spec
describe "check validation on broken challenges" $ do
it "broken metric" $ do
(hSilence [stderr] $ runGEval ["--validate", "--expected-directory", "test/_validation/broken-metric"]) `shouldThrow` anyException
describe "test sample outputs" $ do describe "test sample outputs" $ do
(flip mapM_ ) (Prelude.filter isEvaluationSchemeDescribed listOfAvailableEvaluationSchemes) $ \scheme@(EvaluationScheme metric _) -> do (flip mapM_ ) (Prelude.filter isEvaluationSchemeDescribed listOfAvailableEvaluationSchemes) $ \scheme@(EvaluationScheme metric _) -> do
it (show scheme) $ do it (show scheme) $ do

View File

@ -0,0 +1,8 @@
*~
*.swp
*.bak
*.pyc
*.o
.DS_Store
.token

View File

@ -0,0 +1,27 @@
Tag names and their component
=============================
Tag names and their components (first name/surname) in a text.
Tags:
* person
* surname
* first-name
For each tag a sequence of token IDs separated with commas should be given (after a slash).
Directory structure
-------------------
* `README.md` — this file
* `config.txt` — configuration file
* `train/` — directory with training data
* `train/in.tsv` — input data for the train set
* `train/expected.tsv` — expected (reference) data for the train set
* `dev-0/` — directory with dev (test) data
* `dev-0/in.tsv` — input data for the dev set
* `dev-0/expected.tsv` — expected (reference) data for the dev set
* `test-A` — directory with test data
* `test-A/in.tsv` — input data for the test set
* `test-A/expected.tsv` — expected (reference) data for the test set

View File

@ -0,0 +1 @@
--metric MultiLabel-F1 --metric WER:P-S<3>u --in-header in-header.tsv --out-header out-header.tsv

View File

@ -0,0 +1,3 @@
person/1,2 first-name/1 surname/2
first-name/1
1 person/1,2 first-name/1 surname/2
2 first-name/1

View File

@ -0,0 +1,3 @@
Jan Kowalski is here
I see him
Barbara
1 Jan Kowalski is here
2 I see him
3 Barbara

View File

@ -0,0 +1 @@
Text
1 Text

View File

@ -0,0 +1 @@
Entities
1 Entities

View File

@ -0,0 +1,3 @@
person/1,3 first-name/1 surname/3
first-name/3
1 person/1,3 first-name/1 surname/3
2 first-name/3

View File

@ -0,0 +1,3 @@
John bloody Smith
Nobody is there
I saw Marketa
1 John bloody Smith
2 Nobody is there
3 I saw Marketa

View File

@ -0,0 +1,3 @@
I know Mr John Smith
Steven bloody Brown
James and James
1 I know Mr John Smith
2 Steven bloody Brown
3 James and James

View File

@ -0,0 +1,3 @@
person/3,4,5 first-name/4 surname/5
person/1,3 first-name/1 surname/3
first-name/1 firstname/3
1 person/3,4,5 first-name/4 surname/5
2 person/1,3 first-name/1 surname/3
3 first-name/1 firstname/3