duckling/Duckling/Email/EN/Rules.hs
Lukas Koebis 0d7939b246 Email/EN: Allow 'dot' in emails.
Summary: Duckling supports emails like "hey at things.com" but not "hey at things dot com". Let's add that.

Reviewed By: patapizza

Differential Revision: D6387471

fbshipit-source-id: 349a3a1ee55983daf5fda7579623f0c7bb32357f
2017-12-04 14:01:10 -08:00

43 lines
1.2 KiB
Haskell

-- Copyright (c) 2016-present, Facebook, Inc.
-- All rights reserved.
--
-- This source code is licensed under the BSD-style license found in the
-- LICENSE file in the root directory of this source tree. An additional grant
-- of patent rights can be found in the PATENTS file in the same directory.
{-# LANGUAGE GADTs #-}
{-# LANGUAGE OverloadedStrings #-}
module Duckling.Email.EN.Rules
( rules ) where
import Data.String
import Prelude
import qualified Data.Text as Text
import Duckling.Dimensions.Types
import Duckling.Email.Types (EmailData (..))
import Duckling.Regex.Types
import Duckling.Types
import qualified Duckling.Email.Types as TEmail
-- | Rule recognising e-mail addresses whose separators may be spelled out,
-- e.g. the input "hey at things dot com".
--
-- The regex captures two groups:
--
--   1. the local part: a run of word characters, underscores, plus or minus
--      signs, optionally followed by up to ten more such runs, each introduced
--      by a literal full stop or by " dot ";
--   2. the domain: a leading label of ASCII letters followed by one to ten
--      further labels, each introduced by a literal full stop or by " dot ".
--
-- The two groups are separated by " at " or by an at-sign. The produced
-- 'Email' token carries both groups with every " dot " turned into a full
-- stop, joined by a single at-sign.
--
-- NOTE(review): the " dot " substitution is an exact, lowercase text match.
-- If 'regex' compiles patterns case-insensitively, a spelling such as " DOT "
-- would match but stay unreplaced -- confirm against the 'regex' definition.
ruleEmailSpelledOut :: Rule
ruleEmailSpelledOut = Rule
  { name = "email spelled out"
  , pattern =
      [ regex "([\\w_+-]+(?:(?: dot |\\.)[\\w_+-]+){0,10})(?: at |@)([a-zA-Z]+(?:(?:\\.| dot )[\\w_-]+){1,10})"
      ]
  , prod = \tokens -> case tokens of
      -- Only the first token is inspected; it must be a regex match that
      -- exposes at least the two capture groups described above.
      (Token RegexMatch (GroupMatch (localPart:domainPart:_)):_) ->
        let
          -- Turn every spelled-out " dot " into a literal full stop.
          undot = Text.replace " dot " "."
          address = Text.intercalate "@" (map undot [localPart, domainPart])
        in
          Just (Token Email EmailData { TEmail.value = address })
      _ -> Nothing
  }
-- | All rules exported by this module; currently only the spelled-out
-- e-mail rule.
rules :: [Rule]
rules = [ruleEmailSpelledOut]