duckling/Duckling/Email/EN/Corpus.hs
Lukas Koebis 0d7939b246 Email/EN: Allow 'dot' in emails.
Summary: Duckling supports emails like "hey at things.com" but not "hey at things dot com". Let's add that.

Reviewed By: patapizza

Differential Revision: D6387471

fbshipit-source-id: 349a3a1ee55983daf5fda7579623f0c7bb32357f
2017-12-04 14:01:10 -08:00

61 lines
1.5 KiB
Haskell

-- Copyright (c) 2016-present, Facebook, Inc.
-- All rights reserved.
--
-- This source code is licensed under the BSD-style license found in the
-- LICENSE file in the root directory of this source tree. An additional grant
-- of patent rights can be found in the PATENTS file in the same directory.
{-# LANGUAGE OverloadedStrings #-}
module Duckling.Email.EN.Corpus
( corpus
, negativeCorpus
) where
import Data.String
import Prelude
import qualified Data.Text as Text
import Duckling.Email.Types
import Duckling.Testing.Types
-- | Negative corpus for English emails: 'testContext' paired with a list of
-- input phrases. Judging by the name, these are inputs that should not
-- resolve to an email -- confirm against the test runner that consumes
-- 'NegativeCorpus'.
negativeCorpus :: NegativeCorpus
negativeCorpus = (testContext, rejectedInputs)
  where
    rejectedInputs =
      [ -- "at" followed by a number with a decimal point.
        "fitness at 6.40"
      , "class at 12.00"
      , "tonight at 9.15"
        -- "dot" with whitespace or nothing on one side of it.
      , " dot 2@abci"
      , "x@ dot x"
      , "x@ x dot "
      , "abc@x dot "
        -- One very long input: "a at a" repeated 10000 times back to back.
        -- Presumably a guard against pathological matching time; confirm.
      , Text.replicate 10000 "a at a"
      ]
-- | Positive corpus for English emails: 'testContext' paired with every entry
-- of 'allExamples'.
corpus :: Corpus
corpus = (testContext, allExamples)
-- | All positive examples, flattened into a single list.
--
-- Each table row pairs the address wrapped in 'EmailData' with the input
-- phrases handed to 'examples' alongside it (presumably the phrases that are
-- expected to resolve to that address -- confirm against 'examples').
allExamples :: [Example]
allExamples = concatMap expand table
  where
    -- Turn one (address, inputs) row into its examples.
    expand (address, inputs) = examples (EmailData address) inputs

    table =
      [ ("alice@exAmple.io", ["alice at exAmple.io"])
      , ("yo+yo@blah.org", ["yo+yo at blah.org"])
      , ("1234+abc@x.net", ["1234+abc at x.net"])
      , ("jean-jacques@stuff.co.uk", ["jean-jacques at stuff.co.uk"])
        -- Spelled-out "dot" in the local part and/or the domain.
      , ("asdf+ab.c@gmail.com", ["asdf+ab dot c at gmail dot com"])
      , ("asdf.k@fb.com", ["asdf dot k@fb dot com"])
      ]