-- Copyright (c) 2016-present, Facebook, Inc.
-- All rights reserved.
--
-- This source code is licensed under the BSD-style license found in the
-- LICENSE file in the root directory of this source tree. An additional grant
-- of patent rights can be found in the PATENTS file in the same directory.


{-# LANGUAGE GADTs #-}
{-# LANGUAGE NoRebindableSyntax #-}
{-# LANGUAGE OverloadedStrings #-}

-- | Duration rules for Greek (EL). The only export is 'rules'.
--
-- NOTE(review): several rule names below start with a blank (or consist of a
-- single blank), which looks like an angle-bracket placeholder was lost at
-- some point. They are kept verbatim because rule names are runtime data;
-- confirm against upstream before changing them.
module Duckling.Duration.EL.Rules
  ( rules
  ) where

import Data.HashMap.Strict (HashMap)
import Data.String
import Data.Text (Text)
import Prelude
import qualified Data.HashMap.Strict as HashMap
import qualified Data.Text as Text

import Duckling.Dimensions.Types
import Duckling.Duration.Helpers
import Duckling.Duration.Types (DurationData (DurationData))
import Duckling.Numeral.Helpers (integer, numeralMapEL, parseInt, parseInteger)
import Duckling.Numeral.Types (NumeralData(..))
import Duckling.Regex.Types
import Duckling.Types
import qualified Duckling.Numeral.Types as TNumeral
import qualified Duckling.TimeGrain.Types as TG

-- | Grain suffixes of single-word durations, keyed by the (lower-cased) text
-- captured by the second group of 'ruleNumeralWithGrain'.
--
-- NOTE(review): the @"ετίας"@ key does not look reachable from that capture
-- group (the trailing @ς@ sits outside the group) -- confirm before pruning.
timeGrainMap :: HashMap Text TG.Grain
timeGrainMap = HashMap.fromList $ concat
  [ grainKeys TG.Minute ["λεπτο"]
  , grainKeys TG.Hour   ["ωρο"]
  , grainKeys TG.Day    ["μερο", "ήμερο"]
  , grainKeys TG.Month  ["μηνο"]
  , grainKeys TG.Year   ["ετία", "ετίας", "ετή", "ετέ", "χρονο"]
  ]
  where
    -- Pair every key with the same grain.
    grainKeys :: TG.Grain -> [Text] -> [(Text, TG.Grain)]
    grainKeys grain = map (\key -> (key, grain))

-- | Any match of the pattern yields a fixed 15-minute duration.
ruleDurationQuarterOfAnHour :: Rule
ruleDurationQuarterOfAnHour = Rule
  { name = "quarter of an hour"
  , pattern =
    [ regex "(1/4|[εέ]ν(α|ός)\\s+τ[εέ]τ[αά]ρτου?)(\\s*ω|\\s+(της\\s+)?ώρας)?"
    ]
  , prod = const $ Just (Token Duration (duration TG.Minute 15))
  }

-- | Any match of the pattern yields a fixed 30-minute duration.
ruleDurationHalfAnHour :: Rule
ruleDurationHalfAnHour = Rule
  { name = "half an hour"
  , pattern =
    [ regex "(1/2\\s?((της )?ώρας?|ω)|μισάωρου?)"
    ]
  , prod = const $ Just (Token Duration (duration TG.Minute 30))
  }

-- | Any match of the pattern yields a fixed 45-minute duration.
ruleDurationThreeQuartersOfAnHour :: Rule
ruleDurationThreeQuartersOfAnHour = Rule
  { name = "three quarters of an hour"
  , pattern =
    [ regex "(3/4|τρ[ιί](α|ών)\\s+τ[εέ]τ[αά]ρτ(α|ων))(\\s*ω|\\s+(της\\s+)?ώρας)?"
    ]
  , prod = const $ Just (Token Duration (duration TG.Minute 45))
  }

-- TODO: Single-word composition (#110)
-- | Single-word durations: a numeral prefix (first capture group) fused with
-- a grain suffix (second capture group). The prefix is looked up in
-- 'numeralMapEL' and the suffix in 'timeGrainMap'; if either lookup misses,
-- the rule produces nothing.
ruleNumeralWithGrain :: Rule
ruleNumeralWithGrain = Rule
  { name = " (one word)"
  , pattern =
    [ regex $ concat
        [ "(δ[ιί]|τρ[ιί]|τετρ|πεν[θτ]|εξ|ε[πφ]τ|ο[κχ]τ|εννι|δεκ|"
        , "δεκαπεν[θτ]|εικοσ|εικοσιπεν[θτ]|τριαντ|τριανταπεν[θτ]|σαραντ|"
        , "σαρανταπεν[θτ]|πενηντ|πενηνταπεν[θτ]|εξηντ|ενενηντ)[αά]?"
        , "(λεπτο|ωρο|ή?μερο|μηνο|ετία?|ετ[ήέ]|χρονο)ς?υ?"
        ]
    ]
  , prod = fromFusedWord
  }
  where
    fromFusedWord :: [Token] -> Maybe Token
    fromFusedWord (Token RegexMatch (GroupMatch (prefix:suffix:_)) : _) = do
      grain <- HashMap.lookup (Text.toLower suffix) timeGrainMap
      count <- HashMap.lookup (Text.toLower prefix) numeralMapEL
      Just (Token Duration (duration grain count))
    fromFusedWord _ = Nothing

-- | A numeral followed by a quote mark: @'@ gives minutes, @"@ gives
-- seconds. The numeral's value is floored to obtain the count.
ruleNumeralQuotes :: Rule
ruleNumeralQuotes = Rule
  { name = " + '\""
  , pattern =
    [ Predicate isNatural
    , regex "(['\"])"
    ]
  , prod = fromQuoted
  }
  where
    fromQuoted :: [Token] -> Maybe Token
    fromQuoted
      (Token Numeral nd : Token RegexMatch (GroupMatch (mark:_)) : _) = do
        grain <- quoteGrain mark
        Just (Token Duration (duration grain (floor (TNumeral.value nd))))
    fromQuoted _ = Nothing

    -- Grain denoted by each supported quote mark.
    quoteGrain :: Text -> Maybe TG.Grain
    quoteGrain "'"  = Just TG.Minute
    quoteGrain "\"" = Just TG.Second
    quoteGrain _    = Nothing

-- | Numeral, then the regex-matched word, then a time grain. The middle
-- token is ignored; the result is the floored numeral in that grain.
ruleDurationMoreNumeral :: Rule
ruleDurationMoreNumeral = Rule
  { name = " more "
  , pattern =
    [ Predicate isNatural
    , regex "ακόμα|λιγότερ[οη]"
    , dimension TimeGrain
    ]
  , prod = fromNumeralWordGrain
  }
  where
    fromNumeralWordGrain :: [Token] -> Maybe Token
    fromNumeralWordGrain (Token Numeral nd : _ : Token TimeGrain grain : _) =
      Just (Token Duration (duration grain (floor (TNumeral.value nd))))
    fromNumeralWordGrain _ = Nothing

-- | Same as 'ruleDurationMoreNumeral' with the word after the grain:
-- numeral, time grain, then the regex-matched word (ignored).
ruleDurationNumeralMore :: Rule
ruleDurationNumeralMore = Rule
  { name = " more "
  , pattern =
    [ Predicate isNatural
    , dimension TimeGrain
    , regex "ακόμα|λιγότερ[οη]"
    ]
  , prod = fromNumeralGrainWord
  }
  where
    fromNumeralGrainWord :: [Token] -> Maybe Token
    fromNumeralGrainWord (Token Numeral nd : Token TimeGrain grain : _ : _) =
      Just (Token Duration (duration grain (floor (TNumeral.value nd))))
    fromNumeralGrainWord _ = Nothing

-- | Comma-separated decimal followed by a time grain. Only the 'TG.Hour'
-- grain produces a result; the digits after the comma are used as the
-- numerator over a power-of-ten denominator sized by their length.
ruleDurationDotNumeralHours :: Rule
ruleDurationDotNumeralHours = Rule
  { name = "number.number hours"
  , pattern =
    [ regex "(\\d+),(\\d+)"
    , dimension TimeGrain
    ]
  , prod = fromDecimalHours
  }
  where
    fromDecimalHours :: [Token] -> Maybe Token
    fromDecimalHours
      (Token RegexMatch (GroupMatch (whole:frac:_)) : Token TimeGrain TG.Hour : _) =
        let denominator = 10 ^ Text.length frac
            build hours numerator = Token Duration $
              minutesFromHourMixedFraction hours numerator denominator
        in build <$> parseInteger whole <*> parseInteger frac
    fromDecimalHours _ = Nothing

-- | The regex-matched word followed by a time grain. Delegates to the
-- imported 'timesOneAndAHalf' helper with a count of 0.
ruleHalfDuration :: Rule
ruleHalfDuration = Rule
  { name = "half a "
  , pattern =
    [ regex "μισ[ήό]ς?"
    , dimension TimeGrain
    ]
  , prod = fromHalfGrain
  }
  where
    fromHalfGrain :: [Token] -> Maybe Token
    fromHalfGrain (_ : Token TimeGrain grain : _) =
      fmap (Token Duration) (timesOneAndAHalf grain 0)
    fromHalfGrain _ = Nothing

-- | Numeral, the regex-matched phrase, then a time grain. Delegates to the
-- imported 'timesOneAndAHalf' helper with the floored numeral.
ruleDurationAndAHalf :: Rule
ruleDurationAndAHalf = Rule
  { name = " and a half "
  , pattern =
    [ Predicate isNatural
    , regex "και μισ[ήό]ς?"
    , dimension TimeGrain
    ]
  , prod = fromNumeralAndHalf
  }
  where
    fromNumeralAndHalf :: [Token] -> Maybe Token
    fromNumeralAndHalf (Token Numeral nd : _ : Token TimeGrain grain : _) =
      Token Duration <$> timesOneAndAHalf grain (floor (TNumeral.value nd))
    fromNumeralAndHalf _ = Nothing

-- | Single word fusing a numeral with the "half" suffix, followed by a time
-- grain. The captured numeral is looked up in 'numeralMapEL' and then passed
-- to the imported 'timesOneAndAHalf' helper.
ruleDurationAndAHalfOneWord :: Rule
ruleDurationAndAHalfOneWord = Rule
  { name = " "
  , pattern =
    [ regex $ concat
        [ "(μιά|ενά|δυό|τρεισή|τεσσερι?σή|πεντέ|εξί|ε[πφ]τά|ο[κχ]τώ|εννιά|"
        , "δεκά|εντεκά|δωδεκά)μισ[ιη]ς?"
        ]
    , dimension TimeGrain
    ]
  , prod = fromFusedHalf
  }
  where
    fromFusedHalf :: [Token] -> Maybe Token
    fromFusedHalf
      (Token RegexMatch (GroupMatch (num:_)) : Token TimeGrain grain : _) = do
        whole <- HashMap.lookup (Text.toLower num) numeralMapEL
        Token Duration <$> timesOneAndAHalf grain whole
    fromFusedHalf _ = Nothing

-- | A precision word followed by a duration: the duration token is passed
-- through unchanged and the precision word is dropped.
ruleDurationPrecision :: Rule
ruleDurationPrecision = Rule
  { name = "about|exactly "
  , pattern =
    [ regex "(περίπου|πάνω κάτω|ακριβώς)"
    , dimension Duration
    ]
  , prod = keepDuration
  }
  where
    keepDuration :: [Token] -> Maybe Token
    keepDuration (_ : durationToken : _) = Just durationToken
    keepDuration _ = Nothing

-- | All Greek duration rules defined in this module.
rules :: [Rule]
rules =
  [ ruleDurationQuarterOfAnHour
  , ruleDurationHalfAnHour
  , ruleNumeralQuotes
  , ruleDurationNumeralMore
  , ruleDurationMoreNumeral
  , ruleNumeralWithGrain
  , ruleDurationThreeQuartersOfAnHour
  , ruleDurationDotNumeralHours
  , ruleHalfDuration
  , ruleDurationAndAHalf
  , ruleDurationAndAHalfOneWord
  , ruleDurationPrecision
  ]