Time&Duration/ZH: support Cantonese and more common expressions (#516-2) (#523)

Summary:
2nd set of changes from pull request https://github.com/facebook/duckling/issues/516

Supporting Cantonese and more common expressions in Chinese.
Adding rules file for Duration/ZH.

Pull Request resolved: https://github.com/facebook/duckling/pull/523

Reviewed By: haoxuany

Differential Revision: D23428901

Pulled By: chessai

fbshipit-source-id: 6d04c97b63bac966eb61d77cab2f08f7543dbbf0
This commit is contained in:
kckckcng 2021-01-26 15:08:09 -08:00 committed by Facebook GitHub Bot
parent 28ddc3bff7
commit a82684e723
12 changed files with 2039 additions and 1094 deletions

View File

@ -47,4 +47,60 @@ allExamples = concat
[ "10 月"
, "十 月"
]
, examples (DurationData 30 Minute)
[ "30分鐘"
, "半個鐘"
, "半小時"
, "三十分鐘"
, "卅分鐘"
]
, examples (DurationData 12 Hour)
[ "半日"
, "半天"
, "十二小時"
, "十二個鐘"
]
, examples (DurationData 90 Minute)
[ "一個半小時"
, "個半小時"
, "個半鐘"
, "一個半鐘"
, "1.5小時"
, "一個小時三十分鐘"
, "一小時零三十分鐘"
]
, examples (DurationData 130 Minute)
[ "兩小時十分"
, "一百三十分鐘"
]
, examples (DurationData 3615 Second)
[ "一小時零十五秒"
, "一個鐘零十五秒"
]
, examples (DurationData 45 Day)
[ "一個半月"
, "個半月"
]
, examples (DurationData 27 Month)
[ "兩年零三個月"
, "廿七個月"
]
, examples (DurationData 330 Second)
[ "五個半分鐘"
, "五點五分鐘"
, "5.5分鐘"
, "五分三十秒"
, "五分半鐘"
, "五分半"
]
, examples (DurationData 90 Second)
[ "一分半鐘"
, "一分半"
, "分半鐘"
, "分半"
]
, examples (DurationData 15 Minute)
[ "3個字"
, "三個字"
]
]

View File

@ -0,0 +1,301 @@
-- Copyright (c) 2016-present, Facebook, Inc.
-- All rights reserved.
--
-- This source code is licensed under the BSD-style license found in the
-- LICENSE file in the root directory of this source tree.
{-# LANGUAGE GADTs #-}
{-# LANGUAGE LambdaCase #-}
{-# LANGUAGE NoRebindableSyntax #-}
{-# LANGUAGE OverloadedStrings #-}
module Duckling.Duration.ZH.Rules
( rules
) where
import Prelude
import qualified Data.Text as Text
import Duckling.Dimensions.Types
import Duckling.Duration.Helpers
import Duckling.Duration.Types (DurationData(..))
import Duckling.Numeral.Helpers (parseInteger, decimalsToDouble)
import Duckling.Numeral.Types (NumeralData(..))
import Duckling.Regex.Types
import Duckling.Types
import qualified Duckling.Duration.Types as TDuration
import qualified Duckling.Numeral.Types as TNumeral
import qualified Duckling.TimeGrain.Types as TG
-- | @<natural> 個字@: each counted unit is worth five minutes, so the
-- resulting duration is @5 * n@ minutes (e.g. "三個字" is 15 minutes).
ruleDurationNFiveMinutes :: Rule
ruleDurationNFiveMinutes = Rule
  { name = "number of five minutes"
  , pattern =
    [ Predicate isNatural
    , regex "個字"
    ]
  , prod = fiveMinuteUnits
  }
  where
    -- Only the leading numeral is inspected; the "個字" match is ignored.
    fiveMinuteUnits :: [Token] -> Maybe Token
    fiveMinuteUnits (Token Numeral NumeralData{TNumeral.value = n}:_) =
      pure . Token Duration . duration TG.Minute $ floor n * 5
    fiveMinuteUnits _ = Nothing
-- | Half of a time grain, e.g. "半小時" (30 minutes), "半個鐘", "半日"
-- (12 hours).
--
-- The first pattern element has to consume the literal "半", optionally
-- followed by the measure word. An empty regex here would let the rule fire
-- on a bare time grain and would never match the "半…" inputs above.
--
-- NOTE(review): the pattern was reconstructed from the corpus examples; the
-- simplified measure word "个" is included by analogy -- confirm.
ruleDurationHalfATimeGrain :: Rule
ruleDurationHalfATimeGrain = Rule
  { name = "half a <time-grain>"
  , pattern =
    [ regex "半(個|个)?"
    , dimension TimeGrain
    ]
  , prod = \case
      -- Zero whole units plus one half of the matched grain.
      (_:Token TimeGrain grain:_) -> Token Duration <$> nPlusOneHalf grain 0
      _ -> Nothing
  }
-- | "一個半" / "個半" followed by a time grain: one and a half of that
-- grain (e.g. "一個半小時", "個半月").
ruleDurationOneGrainAndHalf :: Rule
ruleDurationOneGrainAndHalf = Rule
  { name = "a <unit-of-duration> and a half"
  , pattern =
    [ regex "一個半|個半"
    , dimension TimeGrain
    ]
  , prod = \tokens -> case tokens of
      -- The regex token carries no data; the grain is the second token.
      (_:Token TimeGrain unit:_) ->
        fmap (Token Duration) (nPlusOneHalf unit 1)
      _ -> Nothing
  }
-- | A time grain followed by "半" (optionally "半鐘"): one and a half of
-- that grain (e.g. "分半", "分半鐘").
ruleDurationOneGrainAndHalf2 :: Rule
ruleDurationOneGrainAndHalf2 = Rule
  { name = "a <unit-of-duration> and a half"
  , pattern =
    [ dimension TimeGrain
    , regex "半(鐘)?"
    ]
  , prod = grainAndHalf
  }
  where
    -- The grain comes first here; the trailing "半" match is ignored.
    grainAndHalf :: [Token] -> Maybe Token
    grainAndHalf (Token TimeGrain unit:_) =
      Token Duration <$> nPlusOneHalf unit 1
    grainAndHalf _ = Nothing
-- | @<natural> <grain> 半(鐘)@: the numeral counts whole grains and the
-- trailing "半" adds one half (e.g. "五分半", "五分半鐘").
ruleDurationAndHalfGrain :: Rule
ruleDurationAndHalfGrain = Rule
  { name = "<integer> and a half <unit-of-duration>"
  , pattern =
    [ Predicate isNatural
    , dimension TimeGrain
    , regex "半(鐘)?"
    ]
  , prod = \tokens -> case tokens of
      (Token Numeral NumeralData{TNumeral.value = count}:
       Token TimeGrain unit:
       _) -> Token Duration <$> nPlusOneHalf unit (floor count)
      _ -> Nothing
  }
-- | @<natural> 個半 <grain>@: the numeral counts whole grains and "個半"
-- adds one half (e.g. "五個半分鐘").
ruleDurationAndHalfGrain2 :: Rule
ruleDurationAndHalfGrain2 = Rule
  { name = "<integer> and a half <unit-of-duration>"
  , pattern =
    [ Predicate isNatural
    , regex "個半"
    , dimension TimeGrain
    ]
  , prod = countAndHalf
  }
  where
    -- Token layout: numeral, "個半" match (ignored), grain.
    countAndHalf :: [Token] -> Maybe Token
    countAndHalf
      (Token Numeral NumeralData{TNumeral.value = count}:
       _:
       Token TimeGrain unit:
       _) = Token Duration <$> nPlusOneHalf unit (floor count)
    countAndHalf _ = Nothing
-- | Digit-form decimal hours, e.g. "1.5小時".
--
-- The integer and fractional digit groups are parsed separately; the
-- fraction's denominator is 10 raised to the number of fractional digits.
-- Yields 'Nothing' if either group fails to parse.
ruleDurationDotNumeralHours :: Rule
ruleDurationDotNumeralHours = Rule
  { name = "number.number hours"
  , pattern =
    [ regex "(\\d+)\\.(\\d+)"
    , Predicate $ isGrain TG.Hour
    ]
  , prod = \tokens -> case tokens of
      (Token RegexMatch (GroupMatch (whole:frac:_)):_) ->
        Token Duration
          <$> ( minutesFromHourMixedFraction
                  <$> parseInteger whole
                  <*> parseInteger frac
                  <*> pure (10 ^ Text.length frac)
              )
      _ -> Nothing
  }
-- | Spoken decimal hours: @<natural> 點 <natural> <hour grain>@.
--
-- The separator regex must match the spoken decimal point. With an empty
-- separator any two adjacent numerals would be read as a decimal number and
-- the written "點" would never be consumed.
--
-- NOTE(review): "點" is taken from the corpus example "五點五分鐘" (minutes
-- variant); the simplified form "点" is added by analogy -- confirm.
ruleDurationDotNumeralHours2 :: Rule
ruleDurationDotNumeralHours2 = Rule
  { name = "number.number hours"
  , pattern =
    [ Predicate isNatural
    , regex "點|点"
    , Predicate isNatural
    , Predicate $ isGrain TG.Hour
    ]
  , prod = \tokens -> case tokens of
      (Token Numeral NumeralData{TNumeral.value = whole}:
       _:
       Token Numeral NumeralData{TNumeral.value = frac}:
       _) -> Just
        $ Token Duration
        $ duration TG.Minute
        -- Hours (integer part plus the digits after the point turned into
        -- a fraction by decimalsToDouble) converted to minutes; floor drops
        -- any sub-minute remainder.
        $ floor ((whole + decimalsToDouble frac) * 60)
      _ -> Nothing
  }
-- | Digit-form decimal minutes, e.g. "5.5分鐘".
--
-- The integer and fractional digit groups are parsed separately; the
-- fraction's denominator is 10 raised to the number of fractional digits.
-- Yields 'Nothing' if either group fails to parse.
ruleDurationDotNumeralMinutes :: Rule
ruleDurationDotNumeralMinutes = Rule
  { name = "number.number minutes"
  , pattern =
    [ regex "(\\d+)\\.(\\d+)"
    , Predicate $ isGrain TG.Minute
    ]
  , prod = \tokens -> case tokens of
      (Token RegexMatch (GroupMatch (whole:frac:_)):_) ->
        Token Duration
          <$> ( secondsFromHourMixedFraction
                  <$> parseInteger whole
                  <*> parseInteger frac
                  <*> pure (10 ^ Text.length frac)
              )
      _ -> Nothing
  }
-- | Spoken decimal minutes: @<natural> 點 <natural> <minute grain>@,
-- e.g. "五點五分鐘" (330 seconds).
--
-- The separator regex must match the spoken decimal point. With an empty
-- separator any two adjacent numerals would be read as a decimal number and
-- the written "點" would never be consumed.
--
-- NOTE(review): "點" is taken from the corpus example above; the simplified
-- form "点" is added by analogy -- confirm.
ruleDurationDotNumeralMinutes2 :: Rule
ruleDurationDotNumeralMinutes2 = Rule
  { name = "number.number minutes"
  , pattern =
    [ Predicate isNatural
    , regex "點|点"
    , Predicate isNatural
    , Predicate $ isGrain TG.Minute
    ]
  , prod = \tokens -> case tokens of
      (Token Numeral NumeralData{TNumeral.value = whole}:
       _:
       Token Numeral NumeralData{TNumeral.value = frac}:
       _) -> Just
        $ Token Duration
        $ duration TG.Second
        -- Minutes (integer part plus the digits after the point turned into
        -- a fraction by decimalsToDouble) converted to seconds; floor drops
        -- any sub-second remainder.
        $ floor ((whole + decimalsToDouble frac) * 60)
      _ -> Nothing
  }
-- | @<natural> <hour> <natural> <minute>@ with no connector, e.g.
-- "一個小時三十分鐘". The result is expressed in minutes.
ruleDurationHoursAndMinutes :: Rule
ruleDurationHoursAndMinutes = Rule
  { name = "<integer> hours and <integer> minutes"
  , pattern =
    [ Predicate isNatural
    , Predicate $ isGrain TG.Hour
    , Predicate isNatural
    , Predicate $ isGrain TG.Minute
    ]
  , prod = hoursPlusMinutes
  }
  where
    -- Grain tokens (positions 2 and 4) are already fixed by the pattern.
    hoursPlusMinutes :: [Token] -> Maybe Token
    hoursPlusMinutes
      (Token Numeral NumeralData{TNumeral.value = hours}:
       _:
       Token Numeral NumeralData{TNumeral.value = minutes}:
       _) = pure . Token Duration . duration TG.Minute $
              floor minutes + 60 * floor hours
    hoursPlusMinutes _ = Nothing
-- | @<natural> <minute> <natural> <second>@ with no connector, e.g.
-- "五分三十秒". The result is expressed in seconds.
ruleDurationMinutesAndSeconds :: Rule
ruleDurationMinutesAndSeconds = Rule
  { name = "<integer> minutes and <integer> seconds"
  , pattern =
    [ Predicate isNatural
    , Predicate $ isGrain TG.Minute
    , Predicate isNatural
    , Predicate $ isGrain TG.Second
    ]
  , prod = minutesPlusSeconds
  }
  where
    -- Grain tokens (positions 2 and 4) are already fixed by the pattern.
    minutesPlusSeconds :: [Token] -> Maybe Token
    minutesPlusSeconds
      (Token Numeral NumeralData{TNumeral.value = minutes}:
       _:
       Token Numeral NumeralData{TNumeral.value = seconds}:
       _) = pure . Token Duration . duration TG.Second $
              floor seconds + 60 * floor minutes
    minutesPlusSeconds _ = Nothing
-- | @<natural> <hour> <natural> <second>@ with no connector and no minute
-- component. The result is expressed in seconds.
ruleDurationHoursAndSeconds :: Rule
ruleDurationHoursAndSeconds = Rule
  { name = "<integer> hours and <integer> seconds"
  , pattern =
    [ Predicate isNatural
    , Predicate $ isGrain TG.Hour
    , Predicate isNatural
    , Predicate $ isGrain TG.Second
    ]
  , prod = hoursPlusSeconds
  }
  where
    -- Grain tokens (positions 2 and 4) are already fixed by the pattern.
    hoursPlusSeconds :: [Token] -> Maybe Token
    hoursPlusSeconds
      (Token Numeral NumeralData{TNumeral.value = hours}:
       _:
       Token Numeral NumeralData{TNumeral.value = seconds}:
       _) = pure . Token Duration . duration TG.Second $
              floor seconds + 3600 * floor hours
    hoursPlusSeconds _ = Nothing
-- | @<natural> <hour> <natural> <minute> <natural> <second>@ with no
-- connectors. All three components are folded into a single duration
-- expressed in seconds.
ruleDurationHoursAndMinutesAndSeconds :: Rule
ruleDurationHoursAndMinutesAndSeconds = Rule
  { name = "<integer> hours and <integer> minutes and <integer> seconds"
  , pattern =
    [ Predicate isNatural
    , Predicate $ isGrain TG.Hour
    , Predicate isNatural
    , Predicate $ isGrain TG.Minute
    , Predicate isNatural
    , Predicate $ isGrain TG.Second
    ]
  , prod = hmsToSeconds
  }
  where
    -- Grain tokens (positions 2, 4 and 6) are already fixed by the pattern.
    hmsToSeconds :: [Token] -> Maybe Token
    hmsToSeconds
      (Token Numeral NumeralData{TNumeral.value = hours}:
       _:
       Token Numeral NumeralData{TNumeral.value = minutes}:
       _:
       Token Numeral NumeralData{TNumeral.value = seconds}:
       _) = pure . Token Duration . duration TG.Second $
              floor seconds
              + 60 * floor minutes
              + 3600 * floor hours
    hmsToSeconds _ = Nothing
-- | Two durations joined by a connector, e.g. "兩年零三個月" or
-- "一小時零十五秒".
--
-- The connector regex must match the joining word; an empty connector would
-- glue any two adjacent durations together and never consume "零".
-- The guard only accepts a coarser grain followed by a finer one, so
-- "month + year" style inputs are rejected.
--
-- NOTE(review): "零" is taken from the corpus examples above; "又" is added
-- as a common equivalent connector -- confirm before relying on it.
ruleCompositeDurationAnd :: Rule
ruleCompositeDurationAnd = Rule
  { name = "composite <duration> and <duration>"
  , pattern =
    [ dimension Duration
    , regex "零|又"
    , dimension Duration
    ]
  , prod = \case
      (Token Duration DurationData{TDuration.value = v, TDuration.grain = g}:
       _:
       Token Duration dd@DurationData{TDuration.grain = dg}:
       -- Combine via the Semigroup instance of DurationData.
       _) | g > dg -> Just $ Token Duration $ duration g v <> dd
      _ -> Nothing
  }
-- | Every duration rule defined in this module, in declaration order.
rules :: [Rule]
rules = concat
  [ halfGrainRules
  , decimalRules
  , juxtaposedRules
  , [ruleCompositeDurationAnd]
  ]
  where
    -- "字" units and the various "half" constructions.
    halfGrainRules :: [Rule]
    halfGrainRules =
      [ ruleDurationNFiveMinutes
      , ruleDurationHalfATimeGrain
      , ruleDurationOneGrainAndHalf
      , ruleDurationOneGrainAndHalf2
      , ruleDurationAndHalfGrain
      , ruleDurationAndHalfGrain2
      ]
    -- Decimal hours / minutes, in digit and numeral form.
    decimalRules :: [Rule]
    decimalRules =
      [ ruleDurationDotNumeralHours
      , ruleDurationDotNumeralHours2
      , ruleDurationDotNumeralMinutes
      , ruleDurationDotNumeralMinutes2
      ]
    -- Several <numeral> <grain> pairs written back to back.
    juxtaposedRules :: [Rule]
    juxtaposedRules =
      [ ruleDurationHoursAndMinutes
      , ruleDurationMinutesAndSeconds
      , ruleDurationHoursAndSeconds
      , ruleDurationHoursAndMinutesAndSeconds
      ]

View File

@ -35,6 +35,20 @@ classifiers
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
("number of 5 minutes after|past <integer> (hour-of-day)",
Classifier{okData =
ClassData{prior = 0.0, unseen = -3.332204510175204,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)integer (0..10)",
-0.8979415932059586),
("hour", -0.7308875085427924),
("<integer> (latent time-of-day)<number>\20010/\20491",
-2.1972245773362196)],
n = 12},
koData =
ClassData{prior = -infinity, unseen = -1.3862943611198906,
likelihoods = HashMap.fromList [], n = 0}}),
("\21360\24230\20016\25910\33410\31532\22235\22825",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.6094379124341003,
@ -64,11 +78,11 @@ classifiers
likelihoods = HashMap.fromList [("", 0.0)], n = 3}}),
("integer (numeric)",
Classifier{okData =
ClassData{prior = -0.535142931416697, unseen = -4.204692619390966,
ClassData{prior = -0.621403275701104, unseen = -4.204692619390966,
likelihoods = HashMap.fromList [("", 0.0)], n = 65},
koData =
ClassData{prior = -0.8808888048232392, unseen = -3.871201010907891,
likelihoods = HashMap.fromList [("", 0.0)], n = 46}}),
ClassData{prior = -0.7704388548615918, unseen = -4.060443010546419,
likelihoods = HashMap.fromList [("", 0.0)], n = 56}}),
("\21355\22622\33410",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.9459101490553135,
@ -145,29 +159,29 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("month (grain)",
Classifier{okData =
ClassData{prior = -1.0541605260972757,
ClassData{prior = -1.0840134892469568,
unseen = -3.2188758248682006,
likelihoods = HashMap.fromList [("", 0.0)], n = 23},
koData =
ClassData{prior = -0.42845462633286313,
unseen = -3.8066624897703196,
likelihoods = HashMap.fromList [("", 0.0)], n = 43}}),
ClassData{prior = -0.41284521540578695,
unseen = -3.8501476017100584,
likelihoods = HashMap.fromList [("", 0.0)], n = 45}}),
("<time-of-day> o'clock",
Classifier{okData =
ClassData{prior = -0.4418327522790392, unseen = -3.044522437723423,
ClassData{prior = -1.2367626271489267, unseen = -3.044522437723423,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)", -0.6931471805599453),
("hour", -0.6931471805599453)],
n = 9},
koData =
ClassData{prior = -1.0296194171811581,
unseen = -2.5649493574615367,
ClassData{prior = -0.3429447511268303,
unseen = -3.8501476017100584,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)", -0.6931471805599453),
("hour", -0.6931471805599453)],
n = 5}}),
n = 22}}),
("national day",
Classifier{okData =
ClassData{prior = -0.2231435513142097,
@ -225,71 +239,73 @@ classifiers
likelihoods = HashMap.fromList [("", 0.0)], n = 2}}),
("intersect",
Classifier{okData =
ClassData{prior = -0.39204208777602373,
unseen = -5.198497031265826,
ClassData{prior = -0.3968813644167729, unseen = -5.247024072160486,
likelihoods =
HashMap.fromList
[("\20799\31461\33410<part-of-day> <dim time>",
-3.58351893845611),
-3.632309102625542),
("year (numeric with year symbol)\20809\26126\33410",
-3.1135153092103742),
-3.1623054733798064),
("xxxx year<named-month> <day-of-month>", -3.855452653939752),
("year (numeric with year symbol)\25995\26376",
-3.8066624897703196),
-3.855452653939752),
("year (numeric with year symbol)\20061\22812\33410",
-3.8066624897703196),
-3.855452653939752),
("year (numeric with year symbol)<named-month> <day-of-month>",
-2.3597435068339943),
-2.4085336710034264),
("year (numeric with year symbol)\22320\29699\19968\23567\26102",
-4.0943445622221),
("dayday", -2.4849066497880004),
("hourhour", -3.58351893845611),
("hourminute", -3.58351893845611),
-4.143134726391533),
("dayday", -2.5336968139574325),
("hourhour", -3.632309102625542),
("hourminute", -3.632309102625542),
("absorption of , after named day<named-month> <day-of-month>",
-2.4849066497880004),
-2.5336968139574325),
("year (numeric with year symbol)\22823\25995\26399",
-3.8066624897703196),
-3.855452653939752),
("year (numeric with year symbol)\22235\26092\33410",
-4.0943445622221),
-4.143134726391533),
("year (numeric with year symbol)\20303\26842\33410",
-4.0943445622221),
("dayminute", -3.58351893845611),
("tonight<time-of-day> o'clock", -3.58351893845611),
("<dim time> <part-of-day>relative minutes after|past <integer> (hour-of-day)",
-3.58351893845611),
("yearday", -1.3217558399823195),
-4.143134726391533),
("dayminute", -3.632309102625542),
("tonight<time-of-day> o'clock", -3.632309102625542),
("yearday", -1.3099213823353166),
("year (numeric with year symbol)\19971\19971\33410",
-3.1135153092103742),
-3.1623054733798064),
("year (numeric with year symbol)\36926\36234\33410",
-4.0943445622221),
-4.143134726391533),
("year (numeric with year symbol)\29369\22826\26032\24180",
-4.0943445622221),
("yearminute", -4.0943445622221)],
n = 75},
-4.143134726391533),
("yearminute", -4.143134726391533),
("<dim time> <part-of-day>relative (10-59) minutes after|past <integer> (hour-of-day)",
-3.632309102625542)],
n = 78},
koData =
ClassData{prior = -1.126011262856224, unseen = -4.634728988229636,
ClassData{prior = -1.1160040313799788, unseen = -4.700480365792417,
likelihoods =
HashMap.fromList
[("\20799\31461\33410<part-of-day> <dim time>",
-2.4277482359480516),
("dayhour", -3.0155349008501706),
("daymonth", -2.5455312716044354),
-2.4941233048929243),
("dayhour", -3.0819099697950434),
("daymonth", -2.6119063405493077),
("year (numeric with year symbol)February",
-3.0155349008501706),
("year (numeric with year symbol)Sunday", -3.9318256327243257),
-3.0819099697950434),
("year (numeric with year symbol)Sunday", -3.9982007016691985),
("<dim time> <part-of-day><time-of-day> o'clock",
-3.5263605246161616),
("year (numeric with year symbol)April", -3.5263605246161616),
("hourhour", -3.5263605246161616),
("year (numeric with year symbol)March", -2.4277482359480516),
("hourminute", -3.0155349008501706),
("yearmonth", -1.916922612182061),
("dayminute", -3.0155349008501706),
("<dim time> <part-of-day>relative minutes after|past <integer> (hour-of-day)",
-3.0155349008501706),
("yearday", -3.9318256327243257),
-3.592735593561034),
("year (numeric with year symbol)April", -3.592735593561034),
("hourhour", -3.592735593561034),
("xxxx yearFebruary", -3.9982007016691985),
("year (numeric with year symbol)March", -2.4941233048929243),
("hourminute", -3.0819099697950434),
("yearmonth", -1.8581345381729275),
("dayminute", -3.0819099697950434),
("xxxx yearMarch", -3.9982007016691985),
("yearday", -3.9982007016691985),
("absorption of , after named dayFebruary",
-2.5455312716044354)],
n = 36}}),
-2.6119063405493077),
("<dim time> <part-of-day>relative (10-59) minutes after|past <integer> (hour-of-day)",
-3.0819099697950434)],
n = 38}}),
("\20399\20029\33410",
Classifier{okData =
ClassData{prior = 0.0, unseen = -2.3978952727983707,
@ -299,12 +315,13 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("year (grain)",
Classifier{okData =
ClassData{prior = -1.6625477377480489,
ClassData{prior = -1.6964492894237302,
unseen = -2.5649493574615367,
likelihoods = HashMap.fromList [("", 0.0)], n = 11},
koData =
ClassData{prior = -0.2102954088363608, unseen = -3.891820298110627,
likelihoods = HashMap.fromList [("", 0.0)], n = 47}}),
ClassData{prior = -0.2025242641114741,
unseen = -3.9318256327243257,
likelihoods = HashMap.fromList [("", 0.0)], n = 49}}),
("Saturday",
Classifier{okData =
ClassData{prior = -0.8754687373538999,
@ -460,26 +477,39 @@ classifiers
likelihoods = HashMap.fromList [("", 0.0)], n = 3}}),
("hh:mm (time-of-day)",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.9459101490553135,
likelihoods = HashMap.fromList [("", 0.0)], n = 5},
ClassData{prior = 0.0, unseen = -2.4849066497880004,
likelihoods = HashMap.fromList [("", 0.0)], n = 10},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
("<integer> (latent time-of-day)",
("relative (1-9) minutes after|past <integer> (hour-of-day)",
Classifier{okData =
ClassData{prior = -0.2231435513142097,
unseen = -2.9444389791664407,
ClassData{prior = 0.0, unseen = -3.044522437723423,
likelihoods =
HashMap.fromList
[("integer (numeric)", -1.2809338454620642),
("integer (0..10)", -0.325422400434628)],
n = 16},
[("<integer> (latent time-of-day)integer (0..10)",
-0.6931471805599453),
("hour", -0.6931471805599453)],
n = 9},
koData =
ClassData{prior = -1.6094379124341003,
unseen = -1.9459101490553135,
ClassData{prior = -infinity, unseen = -1.0986122886681098,
likelihoods = HashMap.fromList [], n = 0}}),
("<integer> (latent time-of-day)",
Classifier{okData =
ClassData{prior = -0.3101549283038396,
unseen = -3.6109179126442243,
likelihoods =
HashMap.fromList [("integer (numeric)", -0.1823215567939546)],
n = 4}}),
HashMap.fromList
[("integer (numeric)", -1.9740810260220096),
("integer (0..10)", -0.1823215567939546)],
n = 33},
koData =
ClassData{prior = -1.3217558399823195, unseen = -2.772588722239781,
likelihoods =
HashMap.fromList
[("integer (numeric)", -0.5108256237659907),
("one point 2", -1.0986122886681098)],
n = 12}}),
("\36926\36234\33410",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.3862943611198906,
@ -543,6 +573,26 @@ classifiers
ClassData{prior = -0.5625269981428811,
unseen = -3.9318256327243257,
likelihoods = HashMap.fromList [("", 0.0)], n = 49}}),
("relative (10-59) minutes after|past <integer> (hour-of-day)",
Classifier{okData =
ClassData{prior = -0.5465437063680699, unseen = -3.891820298110627,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)integer with consecutive unit modifiers",
-0.7357067949787413),
("hour", -0.7357067949787413)],
n = 22},
koData =
ClassData{prior = -0.8649974374866046,
unseen = -3.6109179126442243,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)number suffix: \21313|\25342",
-1.3862943611198906),
("<integer> (latent time-of-day)integer (0..10)",
-1.3862943611198906),
("hour", -0.750305594399894)],
n = 16}}),
("year (numeric with year symbol)",
Classifier{okData =
ClassData{prior = 0.0, unseen = -3.891820298110627,
@ -673,8 +723,8 @@ classifiers
likelihoods = HashMap.fromList [("", 0.0)], n = 1}}),
("afternoon",
Classifier{okData =
ClassData{prior = 0.0, unseen = -2.3978952727983707,
likelihoods = HashMap.fromList [("", 0.0)], n = 9},
ClassData{prior = 0.0, unseen = -3.367295829986474,
likelihoods = HashMap.fromList [("", 0.0)], n = 27},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
@ -701,8 +751,8 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("February",
Classifier{okData =
ClassData{prior = 0.0, unseen = -3.2188758248682006,
likelihoods = HashMap.fromList [("", 0.0)], n = 23},
ClassData{prior = 0.0, unseen = -3.258096538021482,
likelihoods = HashMap.fromList [("", 0.0)], n = 24},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
@ -727,8 +777,20 @@ classifiers
n = 23}}),
("minute (grain)",
Classifier{okData =
ClassData{prior = 0.0, unseen = -2.890371757896165,
ClassData{prior = -0.3184537311185346, unseen = -2.890371757896165,
likelihoods = HashMap.fromList [("", 0.0)], n = 16},
koData =
ClassData{prior = -1.2992829841302609,
unseen = -2.0794415416798357,
likelihoods = HashMap.fromList [("", 0.0)], n = 6}}),
("xxxx year",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.3862943611198906,
likelihoods =
HashMap.fromList
[("integer (0..10)integer (0..10)integer (0..10)integer (0..10)",
0.0)],
n = 2},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
@ -749,62 +811,66 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("<part-of-day> <dim time>",
Classifier{okData =
ClassData{prior = -0.6097655716208943, unseen = -4.07753744390572,
ClassData{prior = -0.7507762933965817, unseen = -4.859812404361672,
likelihoods =
HashMap.fromList
[("tonight<integer> (latent time-of-day)", -2.451005098112319),
("hourhour", -1.3523928094442093),
("afternoonrelative minutes after|past <integer> (hour-of-day)",
-1.6625477377480489),
("afternoon<time-of-day> o'clock", -2.6741486494265287),
("hourminute", -1.575536360758419),
[("tonight<integer> (latent time-of-day)", -3.242592351485517),
("afternoonrelative (10-59) minutes after|past <integer> (hour-of-day)",
-1.7165360479904674),
("hourhour", -2.1439800628174073),
("afternoon<time-of-day> o'clock", -3.4657359027997265),
("hourminute", -1.0233888674305223),
("afternoon<integer> (latent time-of-day)",
-2.6741486494265287),
("afternoonhh:mm (time-of-day)", -3.367295829986474),
("tonight<time-of-day> o'clock", -2.451005098112319)],
n = 25},
-3.4657359027997265),
("afternoonrelative (1-9) minutes after|past <integer> (hour-of-day)",
-2.5494451709255714),
("afternoonhh:mm (time-of-day)", -3.7534179752515073),
("tonight<time-of-day> o'clock", -3.242592351485517),
("afternoonnumber of 5 minutes after|past <integer> (hour-of-day)",
-2.2870809064580806)],
n = 59},
koData =
ClassData{prior = -0.7841189587656721,
unseen = -3.9318256327243257,
ClassData{prior = -0.6386589952758756, unseen = -4.962844630259907,
likelihoods =
HashMap.fromList
[("hourhour", -1.4271163556401458),
("afternoonrelative minutes after|past <integer> (hour-of-day)",
-1.5141277326297755),
("afternoon<time-of-day> o'clock", -2.120263536200091),
("hourminute", -1.5141277326297755),
[("afternoonrelative (10-59) minutes after|past <integer> (hour-of-day)",
-2.1226137135450447),
("hourhour", -1.024001424876935),
("afternoon<time-of-day> o'clock", -1.820332841672111),
("hourminute", -2.1226137135450447),
("afternoon<integer> (latent time-of-day)",
-1.9661128563728327)],
n = 21}}),
-1.5885312276147867)],
n = 66}}),
("<integer> <unit-of-duration>",
Classifier{okData =
ClassData{prior = -infinity, unseen = -3.044522437723423,
likelihoods = HashMap.fromList [], n = 0},
koData =
ClassData{prior = 0.0, unseen = -6.12029741895095,
ClassData{prior = 0.0, unseen = -6.18826412308259,
likelihoods =
HashMap.fromList
[("number suffix: \21313|\25342month (grain)",
-4.508659285607248),
("week", -2.8992213731731473),
("integer (0..10)month (grain)", -2.7168998163791924),
("integer (0..10)hour (grain)", -3.1736582188749076),
("<number>\20010/\20491week (grain)", -3.720201925242977),
("second", -3.4790398684260895),
("integer (0..10)day (grain)", -2.982602982112198),
("integer (0..10)year (grain)", -3.8155121050473024),
("<number>\20010/\20491month (grain)", -3.3455084758015667),
("integer (numeric)year (grain)", -2.246896187133457),
("integer (0..10)second (grain)", -3.4790398684260895),
("day", -2.982602982112198), ("year", -2.0750459302067976),
("integer (0..10)minute (grain)", -3.2848838539851317),
("hour", -2.982602982112198),
("integer (0..10)week (grain)", -3.410046996939138),
("month", -1.9437099281457109),
("<number>\20010/\20491hour (grain)", -4.508659285607248),
("integer (numeric)month (grain)", -3.2848838539851317),
("minute", -3.2848838539851317)],
n = 217}}),
-4.576770711466393),
("week", -2.967332799032293),
("integer (0..10)month (grain)", -2.720472721100767),
("integer (0..10)hour (grain)", -3.050714407971344),
("<number>\20010/\20491week (grain)", -3.788313351102123),
("second", -3.5471512942852352),
("integer (0..10)day (grain)", -3.050714407971344),
("integer (0..10)year (grain)", -3.7013019741124937),
("<number>\20010/\20491month (grain)", -3.4136199016607125),
("integer (numeric)year (grain)", -2.315007612992603),
("integer (0..10)second (grain)", -3.5471512942852352),
("day", -3.050714407971344), ("year", -2.1086711799947744),
("integer (0..10)minute (grain)", -3.050714407971344),
("hour", -3.050714407971344),
("integer (0..10)week (grain)", -3.4781584227982836),
("month", -1.9815160045095277),
("integer (numeric)month (grain)", -3.3529952798442775),
("integer with consecutive unit modifiersminute (grain)",
-4.24029847484518),
("minute", -2.81891279391402)],
n = 233}}),
("\32769\26495\33410",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.3862943611198906,
@ -821,56 +887,35 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("<time-of-day> am|pm",
Classifier{okData =
ClassData{prior = -0.4700036292457356, unseen = -2.70805020110221,
ClassData{prior = -0.5596157879354228, unseen = -3.044522437723423,
likelihoods =
HashMap.fromList
[("hh:mm (time-of-day)", -1.252762968495368),
("<integer> (latent time-of-day)", -1.540445040947149),
("hour", -1.540445040947149), ("minute", -1.252762968495368)],
n = 5},
[("hh:mm (time-of-day)", -1.0498221244986778),
("<integer> (latent time-of-day)", -1.8971199848858813),
("hour", -1.8971199848858813), ("minute", -1.0498221244986778)],
n = 8},
koData =
ClassData{prior = -0.9808292530117262,
unseen = -2.3978952727983707,
ClassData{prior = -0.8472978603872037, unseen = -2.833213344056216,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)", -0.916290731874155),
("hour", -0.916290731874155)],
n = 3}}),
("relative minutes after|past <integer> (hour-of-day)",
Classifier{okData =
ClassData{prior = -0.6931471805599453,
unseen = -3.2188758248682006,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)integer with consecutive unit modifiers",
-0.7801585575495751),
("hour", -0.7801585575495751)],
n = 10},
koData =
ClassData{prior = -0.6931471805599453,
unseen = -3.2188758248682006,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)number suffix: \21313|\25342",
-1.3862943611198906),
("<integer> (latent time-of-day)integer (0..10)",
-1.3862943611198906),
("hour", -0.7801585575495751)],
n = 10}}),
[("<integer> (latent time-of-day)", -0.8266785731844679),
("hour", -0.8266785731844679)],
n = 6}}),
("one point 2",
Classifier{okData =
ClassData{prior = -infinity, unseen = -1.3862943611198906,
ClassData{prior = -infinity, unseen = -1.6094379124341003,
likelihoods = HashMap.fromList [], n = 0},
koData =
ClassData{prior = 0.0, unseen = -2.772588722239781,
ClassData{prior = 0.0, unseen = -3.5553480614894135,
likelihoods =
HashMap.fromList
[("integer (0..10)integer (0..10)", -1.3217558399823195),
[("integer (0..10)integer (0..10)", -0.8873031950009028),
("integer (0..10)number suffix: \21313|\25342",
-1.3217558399823195),
-1.7346010553881064),
("integer (0..10)integer with consecutive unit modifiers",
-0.7621400520468967)],
n = 12}}),
-1.128465251817791),
("integer (0..10)<number>\20010/\20491", -2.4277482359480516)],
n = 30}}),
("intersect by \",\"",
Classifier{okData =
ClassData{prior = -0.40546510810816444,
@ -904,16 +949,20 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("integer with consecutive unit modifiers",
Classifier{okData =
ClassData{prior = 0.0, unseen = -3.367295829986474,
ClassData{prior = -5.715841383994864e-2,
unseen = -3.6109179126442243,
likelihoods =
HashMap.fromList
[("number suffix: \21313|\25342integer (0..10)",
-0.6931471805599453),
("integer (0..10)integer (0..10)", -0.6931471805599453)],
n = 26},
n = 34},
koData =
ClassData{prior = -infinity, unseen = -1.0986122886681098,
likelihoods = HashMap.fromList [], n = 0}}),
ClassData{prior = -2.890371757896165, unseen = -1.6094379124341003,
likelihoods =
HashMap.fromList
[("integer (0..10)integer (0..10)", -0.2876820724517809)],
n = 2}}),
("second (grain)",
Classifier{okData =
ClassData{prior = 0.0, unseen = -2.70805020110221,
@ -977,8 +1026,8 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("March",
Classifier{okData =
ClassData{prior = 0.0, unseen = -2.772588722239781,
likelihoods = HashMap.fromList [("", 0.0)], n = 14},
ClassData{prior = 0.0, unseen = -2.833213344056216,
likelihoods = HashMap.fromList [("", 0.0)], n = 15},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
@ -991,11 +1040,12 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("the day after tomorrow",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.6094379124341003,
ClassData{prior = -0.5108256237659907,
unseen = -1.6094379124341003,
likelihoods = HashMap.fromList [("", 0.0)], n = 3},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
ClassData{prior = -0.916290731874155, unseen = -1.3862943611198906,
likelihoods = HashMap.fromList [("", 0.0)], n = 2}}),
("\22307\21608\20845",
Classifier{okData =
ClassData{prior = -0.6931471805599453,
@ -1076,27 +1126,25 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("next n <cycle>",
Classifier{okData =
ClassData{prior = 0.0, unseen = -4.61512051684126,
ClassData{prior = 0.0, unseen = -4.605170185988091,
likelihoods =
HashMap.fromList
[("week", -2.4079456086518722),
("integer (0..10)hour (grain)", -2.659260036932778),
("<number>\20010/\20491week (grain)", -2.995732273553991),
("second", -2.8134107167600364),
("integer (0..10)day (grain)", -2.5257286443082556),
("integer (0..10)year (grain)", -3.2188758248682006),
("<number>\20010/\20491month (grain)", -2.8134107167600364),
("integer (0..10)second (grain)", -2.8134107167600364),
("day", -2.5257286443082556), ("year", -3.2188758248682006),
("integer (0..10)minute (grain)", -2.659260036932778),
("hour", -2.4079456086518722),
("integer (0..10)week (grain)", -2.995732273553991),
("month", -2.8134107167600364),
("<number>\20010/\20491hour (grain)", -3.506557897319982),
("minute", -2.659260036932778)],
[("week", -2.3978952727983707),
("integer (0..10)hour (grain)", -2.3978952727983707),
("<number>\20010/\20491week (grain)", -2.9856819377004897),
("second", -2.803360380906535),
("integer (0..10)day (grain)", -2.515678308454754),
("integer (0..10)year (grain)", -3.2088254890146994),
("<number>\20010/\20491month (grain)", -2.803360380906535),
("integer (0..10)second (grain)", -2.803360380906535),
("day", -2.515678308454754), ("year", -3.2088254890146994),
("integer (0..10)minute (grain)", -2.649209701079277),
("hour", -2.3978952727983707),
("integer (0..10)week (grain)", -2.9856819377004897),
("month", -2.803360380906535), ("minute", -2.649209701079277)],
n = 42},
koData =
ClassData{prior = -infinity, unseen = -2.833213344056216,
ClassData{prior = -infinity, unseen = -2.772588722239781,
likelihoods = HashMap.fromList [], n = 0}}),
("\19975\22307\33410",
Classifier{okData =
@ -1112,6 +1160,14 @@ classifiers
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
("number of five minutes",
Classifier{okData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0},
koData =
ClassData{prior = 0.0, unseen = -1.3862943611198906,
likelihoods = HashMap.fromList [("integer (0..10)", 0.0)],
n = 2}}),
("\20799\31461\33410",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.9459101490553135,
@ -1134,6 +1190,18 @@ classifiers
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
("number.number minutes",
Classifier{okData =
ClassData{prior = -infinity, unseen = -1.0986122886681098,
likelihoods = HashMap.fromList [], n = 0},
koData =
ClassData{prior = 0.0, unseen = -2.3978952727983707,
likelihoods =
HashMap.fromList
[("integer (0..10)integer with consecutive unit modifiersminute (grain)",
-0.6931471805599453),
("minute", -0.6931471805599453)],
n = 4}}),
("\32822\31267\21463\38590\26085",
Classifier{okData =
ClassData{prior = -1.0296194171811581,
@ -1145,19 +1213,19 @@ classifiers
likelihoods = HashMap.fromList [("", 0.0)], n = 9}}),
("<named-month> <day-of-month>",
Classifier{okData =
ClassData{prior = 0.0, unseen = -4.709530201312334,
ClassData{prior = 0.0, unseen = -4.762173934797756,
likelihoods =
HashMap.fromList
[("Marchinteger (0..10)", -2.6210388241125804),
("Marchinteger (numeric)", -3.0910424533583156),
("Aprilinteger (numeric)", -3.6018680771243066),
("Februaryinteger (0..10)", -2.6210388241125804),
("Februarynumber suffix: \21313|\25342", -2.6210388241125804),
("month", -0.7492366472109889),
("Februaryinteger (numeric)", -2.503255788456197),
[("Marchinteger (0..10)", -2.5563656137701454),
("Marchinteger (numeric)", -3.144152278672264),
("Aprilinteger (numeric)", -3.654977902438255),
("Februaryinteger (0..10)", -2.6741486494265287),
("Februarynumber suffix: \21313|\25342", -2.6741486494265287),
("month", -0.7462570058738938),
("Februaryinteger (numeric)", -2.5563656137701454),
("Februaryinteger with consecutive unit modifiers",
-1.8672670217362002)],
n = 51},
-1.8091512119399242)],
n = 54},
koData =
ClassData{prior = -infinity, unseen = -2.1972245773362196,
likelihoods = HashMap.fromList [], n = 0}}),
@ -1191,14 +1259,21 @@ classifiers
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
("two days after tomorrow",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.3862943611198906,
likelihoods = HashMap.fromList [("", 0.0)], n = 2},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
("integer (0..10)",
Classifier{okData =
ClassData{prior = -0.7055697005585025,
unseen = -5.0875963352323845,
likelihoods = HashMap.fromList [("", 0.0)], n = 160},
ClassData{prior = -0.6026331730191135,
unseen = -5.3471075307174685,
likelihoods = HashMap.fromList [("", 0.0)], n = 208},
koData =
ClassData{prior = -0.680877087968131, unseen = -5.111987788356543,
likelihoods = HashMap.fromList [("", 0.0)], n = 164}}),
ClassData{prior = -0.7926767759069784, unseen = -5.159055299214529,
likelihoods = HashMap.fromList [("", 0.0)], n = 172}}),
("last n <cycle>",
Classifier{okData =
ClassData{prior = 0.0, unseen = -4.605170185988091,
@ -1236,27 +1311,25 @@ classifiers
n = 10}}),
("n <cycle> last",
Classifier{okData =
ClassData{prior = 0.0, unseen = -4.04305126783455,
ClassData{prior = 0.0, unseen = -4.02535169073515,
likelihoods =
HashMap.fromList
[("week", -2.4159137783010487),
("integer (0..10)hour (grain)", -2.9267394020670396),
("<number>\20010/\20491week (grain)", -2.9267394020670396),
("second", -2.9267394020670396),
("integer (0..10)day (grain)", -2.4159137783010487),
("integer (0..10)year (grain)", -2.9267394020670396),
("<number>\20010/\20491month (grain)", -2.9267394020670396),
("integer (0..10)second (grain)", -2.9267394020670396),
("day", -2.4159137783010487), ("year", -2.9267394020670396),
("integer (0..10)minute (grain)", -2.9267394020670396),
("hour", -2.4159137783010487),
("integer (0..10)week (grain)", -2.9267394020670396),
("month", -2.9267394020670396),
("<number>\20010/\20491hour (grain)", -2.9267394020670396),
("minute", -2.9267394020670396)],
[("week", -2.3978952727983707),
("integer (0..10)hour (grain)", -2.3978952727983707),
("<number>\20010/\20491week (grain)", -2.908720896564361),
("second", -2.908720896564361),
("integer (0..10)day (grain)", -2.3978952727983707),
("integer (0..10)year (grain)", -2.908720896564361),
("<number>\20010/\20491month (grain)", -2.908720896564361),
("integer (0..10)second (grain)", -2.908720896564361),
("day", -2.3978952727983707), ("year", -2.908720896564361),
("integer (0..10)minute (grain)", -2.908720896564361),
("hour", -2.3978952727983707),
("integer (0..10)week (grain)", -2.908720896564361),
("month", -2.908720896564361), ("minute", -2.908720896564361)],
n = 20},
koData =
ClassData{prior = -infinity, unseen = -2.833213344056216,
ClassData{prior = -infinity, unseen = -2.772588722239781,
likelihoods = HashMap.fromList [], n = 0}}),
("\24527\24724\33410",
Classifier{okData =
@ -1281,11 +1354,11 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("number suffix: \21313|\25342",
Classifier{okData =
ClassData{prior = -0.2231435513142097,
unseen = -3.0910424533583156,
likelihoods = HashMap.fromList [("", 0.0)], n = 20},
ClassData{prior = -0.18924199963852842,
unseen = -3.258096538021482,
likelihoods = HashMap.fromList [("", 0.0)], n = 24},
koData =
ClassData{prior = -1.6094379124341003,
ClassData{prior = -1.7578579175523736,
unseen = -1.9459101490553135,
likelihoods = HashMap.fromList [("", 0.0)], n = 5}}),
("\22320\29699\19968\23567\26102",
@ -1322,11 +1395,19 @@ classifiers
likelihoods = HashMap.fromList [("", 0.0)], n = 6}}),
("<number>\20010/\20491",
Classifier{okData =
ClassData{prior = 0.0, unseen = -3.4339872044851463,
likelihoods = HashMap.fromList [("integer (0..10)", 0.0)], n = 29},
ClassData{prior = -0.2006706954621511,
unseen = -3.4011973816621555,
likelihoods =
HashMap.fromList [("integer (0..10)", -3.509131981127006e-2)],
n = 27},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
ClassData{prior = -1.7047480922384253,
unseen = -2.1972245773362196,
likelihoods =
HashMap.fromList
[("one point 2", -0.9808292530117262),
("integer (0..10)", -0.4700036292457356)],
n = 6}}),
("\24773\20154\33410",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.9459101490553135,

View File

@ -35,6 +35,20 @@ classifiers
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
("number of 5 minutes after|past <integer> (hour-of-day)",
Classifier{okData =
ClassData{prior = 0.0, unseen = -3.332204510175204,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)integer (0..10)",
-0.8979415932059586),
("hour", -0.7308875085427924),
("<integer> (latent time-of-day)<number>\20010/\20491",
-2.1972245773362196)],
n = 12},
koData =
ClassData{prior = -infinity, unseen = -1.3862943611198906,
likelihoods = HashMap.fromList [], n = 0}}),
("\21360\24230\20016\25910\33410\31532\22235\22825",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.6094379124341003,
@ -64,11 +78,11 @@ classifiers
likelihoods = HashMap.fromList [("", 0.0)], n = 3}}),
("integer (numeric)",
Classifier{okData =
ClassData{prior = -0.535142931416697, unseen = -4.204692619390966,
ClassData{prior = -0.621403275701104, unseen = -4.204692619390966,
likelihoods = HashMap.fromList [("", 0.0)], n = 65},
koData =
ClassData{prior = -0.8808888048232392, unseen = -3.871201010907891,
likelihoods = HashMap.fromList [("", 0.0)], n = 46}}),
ClassData{prior = -0.7704388548615918, unseen = -4.060443010546419,
likelihoods = HashMap.fromList [("", 0.0)], n = 56}}),
("\21355\22622\33410",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.9459101490553135,
@ -145,29 +159,29 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("month (grain)",
Classifier{okData =
ClassData{prior = -1.0541605260972757,
ClassData{prior = -1.0840134892469568,
unseen = -3.2188758248682006,
likelihoods = HashMap.fromList [("", 0.0)], n = 23},
koData =
ClassData{prior = -0.42845462633286313,
unseen = -3.8066624897703196,
likelihoods = HashMap.fromList [("", 0.0)], n = 43}}),
ClassData{prior = -0.41284521540578695,
unseen = -3.8501476017100584,
likelihoods = HashMap.fromList [("", 0.0)], n = 45}}),
("<time-of-day> o'clock",
Classifier{okData =
ClassData{prior = -0.4418327522790392, unseen = -3.044522437723423,
ClassData{prior = -1.2367626271489267, unseen = -3.044522437723423,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)", -0.6931471805599453),
("hour", -0.6931471805599453)],
n = 9},
koData =
ClassData{prior = -1.0296194171811581,
unseen = -2.5649493574615367,
ClassData{prior = -0.3429447511268303,
unseen = -3.8501476017100584,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)", -0.6931471805599453),
("hour", -0.6931471805599453)],
n = 5}}),
n = 22}}),
("national day",
Classifier{okData =
ClassData{prior = -0.2231435513142097,
@ -225,71 +239,73 @@ classifiers
likelihoods = HashMap.fromList [("", 0.0)], n = 2}}),
("intersect",
Classifier{okData =
ClassData{prior = -0.39204208777602373,
unseen = -5.198497031265826,
ClassData{prior = -0.3968813644167729, unseen = -5.247024072160486,
likelihoods =
HashMap.fromList
[("\20799\31461\33410<part-of-day> <dim time>",
-3.58351893845611),
-3.632309102625542),
("year (numeric with year symbol)\20809\26126\33410",
-3.1135153092103742),
-3.1623054733798064),
("xxxx year<named-month> <day-of-month>", -3.855452653939752),
("year (numeric with year symbol)\25995\26376",
-3.8066624897703196),
-3.855452653939752),
("year (numeric with year symbol)\20061\22812\33410",
-3.8066624897703196),
-3.855452653939752),
("year (numeric with year symbol)<named-month> <day-of-month>",
-2.3597435068339943),
-2.4085336710034264),
("year (numeric with year symbol)\22320\29699\19968\23567\26102",
-4.0943445622221),
("dayday", -2.4849066497880004),
("hourhour", -3.58351893845611),
("hourminute", -3.58351893845611),
-4.143134726391533),
("dayday", -2.5336968139574325),
("hourhour", -3.632309102625542),
("hourminute", -3.632309102625542),
("absorption of , after named day<named-month> <day-of-month>",
-2.4849066497880004),
-2.5336968139574325),
("year (numeric with year symbol)\22823\25995\26399",
-3.8066624897703196),
-3.855452653939752),
("year (numeric with year symbol)\22235\26092\33410",
-4.0943445622221),
-4.143134726391533),
("year (numeric with year symbol)\20303\26842\33410",
-4.0943445622221),
("dayminute", -3.58351893845611),
("tonight<time-of-day> o'clock", -3.58351893845611),
("<dim time> <part-of-day>relative minutes after|past <integer> (hour-of-day)",
-3.58351893845611),
("yearday", -1.3217558399823195),
-4.143134726391533),
("dayminute", -3.632309102625542),
("tonight<time-of-day> o'clock", -3.632309102625542),
("yearday", -1.3099213823353166),
("year (numeric with year symbol)\19971\19971\33410",
-3.1135153092103742),
-3.1623054733798064),
("year (numeric with year symbol)\36926\36234\33410",
-4.0943445622221),
-4.143134726391533),
("year (numeric with year symbol)\29369\22826\26032\24180",
-4.0943445622221),
("yearminute", -4.0943445622221)],
n = 75},
-4.143134726391533),
("yearminute", -4.143134726391533),
("<dim time> <part-of-day>relative (10-59) minutes after|past <integer> (hour-of-day)",
-3.632309102625542)],
n = 78},
koData =
ClassData{prior = -1.126011262856224, unseen = -4.634728988229636,
ClassData{prior = -1.1160040313799788, unseen = -4.700480365792417,
likelihoods =
HashMap.fromList
[("\20799\31461\33410<part-of-day> <dim time>",
-2.4277482359480516),
("dayhour", -3.0155349008501706),
("daymonth", -2.5455312716044354),
-2.4941233048929243),
("dayhour", -3.0819099697950434),
("daymonth", -2.6119063405493077),
("year (numeric with year symbol)February",
-3.0155349008501706),
("year (numeric with year symbol)Sunday", -3.9318256327243257),
-3.0819099697950434),
("year (numeric with year symbol)Sunday", -3.9982007016691985),
("<dim time> <part-of-day><time-of-day> o'clock",
-3.5263605246161616),
("year (numeric with year symbol)April", -3.5263605246161616),
("hourhour", -3.5263605246161616),
("year (numeric with year symbol)March", -2.4277482359480516),
("hourminute", -3.0155349008501706),
("yearmonth", -1.916922612182061),
("dayminute", -3.0155349008501706),
("<dim time> <part-of-day>relative minutes after|past <integer> (hour-of-day)",
-3.0155349008501706),
("yearday", -3.9318256327243257),
-3.592735593561034),
("year (numeric with year symbol)April", -3.592735593561034),
("hourhour", -3.592735593561034),
("xxxx yearFebruary", -3.9982007016691985),
("year (numeric with year symbol)March", -2.4941233048929243),
("hourminute", -3.0819099697950434),
("yearmonth", -1.8581345381729275),
("dayminute", -3.0819099697950434),
("xxxx yearMarch", -3.9982007016691985),
("yearday", -3.9982007016691985),
("absorption of , after named dayFebruary",
-2.5455312716044354)],
n = 36}}),
-2.6119063405493077),
("<dim time> <part-of-day>relative (10-59) minutes after|past <integer> (hour-of-day)",
-3.0819099697950434)],
n = 38}}),
("\20399\20029\33410",
Classifier{okData =
ClassData{prior = 0.0, unseen = -2.3978952727983707,
@ -299,12 +315,13 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("year (grain)",
Classifier{okData =
ClassData{prior = -1.6625477377480489,
ClassData{prior = -1.6964492894237302,
unseen = -2.5649493574615367,
likelihoods = HashMap.fromList [("", 0.0)], n = 11},
koData =
ClassData{prior = -0.2102954088363608, unseen = -3.891820298110627,
likelihoods = HashMap.fromList [("", 0.0)], n = 47}}),
ClassData{prior = -0.2025242641114741,
unseen = -3.9318256327243257,
likelihoods = HashMap.fromList [("", 0.0)], n = 49}}),
("Saturday",
Classifier{okData =
ClassData{prior = -0.8754687373538999,
@ -460,26 +477,39 @@ classifiers
likelihoods = HashMap.fromList [("", 0.0)], n = 3}}),
("hh:mm (time-of-day)",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.9459101490553135,
likelihoods = HashMap.fromList [("", 0.0)], n = 5},
ClassData{prior = 0.0, unseen = -2.4849066497880004,
likelihoods = HashMap.fromList [("", 0.0)], n = 10},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
("<integer> (latent time-of-day)",
("relative (1-9) minutes after|past <integer> (hour-of-day)",
Classifier{okData =
ClassData{prior = -0.2231435513142097,
unseen = -2.9444389791664407,
ClassData{prior = 0.0, unseen = -3.044522437723423,
likelihoods =
HashMap.fromList
[("integer (numeric)", -1.2809338454620642),
("integer (0..10)", -0.325422400434628)],
n = 16},
[("<integer> (latent time-of-day)integer (0..10)",
-0.6931471805599453),
("hour", -0.6931471805599453)],
n = 9},
koData =
ClassData{prior = -1.6094379124341003,
unseen = -1.9459101490553135,
ClassData{prior = -infinity, unseen = -1.0986122886681098,
likelihoods = HashMap.fromList [], n = 0}}),
("<integer> (latent time-of-day)",
Classifier{okData =
ClassData{prior = -0.3101549283038396,
unseen = -3.6109179126442243,
likelihoods =
HashMap.fromList [("integer (numeric)", -0.1823215567939546)],
n = 4}}),
HashMap.fromList
[("integer (numeric)", -1.9740810260220096),
("integer (0..10)", -0.1823215567939546)],
n = 33},
koData =
ClassData{prior = -1.3217558399823195, unseen = -2.772588722239781,
likelihoods =
HashMap.fromList
[("integer (numeric)", -0.5108256237659907),
("one point 2", -1.0986122886681098)],
n = 12}}),
("\36926\36234\33410",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.3862943611198906,
@ -543,6 +573,26 @@ classifiers
ClassData{prior = -0.5625269981428811,
unseen = -3.9318256327243257,
likelihoods = HashMap.fromList [("", 0.0)], n = 49}}),
("relative (10-59) minutes after|past <integer> (hour-of-day)",
Classifier{okData =
ClassData{prior = -0.5465437063680699, unseen = -3.891820298110627,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)integer with consecutive unit modifiers",
-0.7357067949787413),
("hour", -0.7357067949787413)],
n = 22},
koData =
ClassData{prior = -0.8649974374866046,
unseen = -3.6109179126442243,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)number suffix: \21313|\25342",
-1.3862943611198906),
("<integer> (latent time-of-day)integer (0..10)",
-1.3862943611198906),
("hour", -0.750305594399894)],
n = 16}}),
("year (numeric with year symbol)",
Classifier{okData =
ClassData{prior = 0.0, unseen = -3.891820298110627,
@ -673,8 +723,8 @@ classifiers
likelihoods = HashMap.fromList [("", 0.0)], n = 1}}),
("afternoon",
Classifier{okData =
ClassData{prior = 0.0, unseen = -2.3978952727983707,
likelihoods = HashMap.fromList [("", 0.0)], n = 9},
ClassData{prior = 0.0, unseen = -3.367295829986474,
likelihoods = HashMap.fromList [("", 0.0)], n = 27},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
@ -701,8 +751,8 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("February",
Classifier{okData =
ClassData{prior = 0.0, unseen = -3.2188758248682006,
likelihoods = HashMap.fromList [("", 0.0)], n = 23},
ClassData{prior = 0.0, unseen = -3.258096538021482,
likelihoods = HashMap.fromList [("", 0.0)], n = 24},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
@ -727,8 +777,20 @@ classifiers
n = 23}}),
("minute (grain)",
Classifier{okData =
ClassData{prior = 0.0, unseen = -2.890371757896165,
ClassData{prior = -0.3184537311185346, unseen = -2.890371757896165,
likelihoods = HashMap.fromList [("", 0.0)], n = 16},
koData =
ClassData{prior = -1.2992829841302609,
unseen = -2.0794415416798357,
likelihoods = HashMap.fromList [("", 0.0)], n = 6}}),
("xxxx year",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.3862943611198906,
likelihoods =
HashMap.fromList
[("integer (0..10)integer (0..10)integer (0..10)integer (0..10)",
0.0)],
n = 2},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
@ -749,62 +811,66 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("<part-of-day> <dim time>",
Classifier{okData =
ClassData{prior = -0.6097655716208943, unseen = -4.07753744390572,
ClassData{prior = -0.7507762933965817, unseen = -4.859812404361672,
likelihoods =
HashMap.fromList
[("tonight<integer> (latent time-of-day)", -2.451005098112319),
("hourhour", -1.3523928094442093),
("afternoonrelative minutes after|past <integer> (hour-of-day)",
-1.6625477377480489),
("afternoon<time-of-day> o'clock", -2.6741486494265287),
("hourminute", -1.575536360758419),
[("tonight<integer> (latent time-of-day)", -3.242592351485517),
("afternoonrelative (10-59) minutes after|past <integer> (hour-of-day)",
-1.7165360479904674),
("hourhour", -2.1439800628174073),
("afternoon<time-of-day> o'clock", -3.4657359027997265),
("hourminute", -1.0233888674305223),
("afternoon<integer> (latent time-of-day)",
-2.6741486494265287),
("afternoonhh:mm (time-of-day)", -3.367295829986474),
("tonight<time-of-day> o'clock", -2.451005098112319)],
n = 25},
-3.4657359027997265),
("afternoonrelative (1-9) minutes after|past <integer> (hour-of-day)",
-2.5494451709255714),
("afternoonhh:mm (time-of-day)", -3.7534179752515073),
("tonight<time-of-day> o'clock", -3.242592351485517),
("afternoonnumber of 5 minutes after|past <integer> (hour-of-day)",
-2.2870809064580806)],
n = 59},
koData =
ClassData{prior = -0.7841189587656721,
unseen = -3.9318256327243257,
ClassData{prior = -0.6386589952758756, unseen = -4.962844630259907,
likelihoods =
HashMap.fromList
[("hourhour", -1.4271163556401458),
("afternoonrelative minutes after|past <integer> (hour-of-day)",
-1.5141277326297755),
("afternoon<time-of-day> o'clock", -2.120263536200091),
("hourminute", -1.5141277326297755),
[("afternoonrelative (10-59) minutes after|past <integer> (hour-of-day)",
-2.1226137135450447),
("hourhour", -1.024001424876935),
("afternoon<time-of-day> o'clock", -1.820332841672111),
("hourminute", -2.1226137135450447),
("afternoon<integer> (latent time-of-day)",
-1.9661128563728327)],
n = 21}}),
-1.5885312276147867)],
n = 66}}),
("<integer> <unit-of-duration>",
Classifier{okData =
ClassData{prior = -infinity, unseen = -3.044522437723423,
likelihoods = HashMap.fromList [], n = 0},
koData =
ClassData{prior = 0.0, unseen = -6.12029741895095,
ClassData{prior = 0.0, unseen = -6.18826412308259,
likelihoods =
HashMap.fromList
[("number suffix: \21313|\25342month (grain)",
-4.508659285607248),
("week", -2.8992213731731473),
("integer (0..10)month (grain)", -2.7168998163791924),
("integer (0..10)hour (grain)", -3.1736582188749076),
("<number>\20010/\20491week (grain)", -3.720201925242977),
("second", -3.4790398684260895),
("integer (0..10)day (grain)", -2.982602982112198),
("integer (0..10)year (grain)", -3.8155121050473024),
("<number>\20010/\20491month (grain)", -3.3455084758015667),
("integer (numeric)year (grain)", -2.246896187133457),
("integer (0..10)second (grain)", -3.4790398684260895),
("day", -2.982602982112198), ("year", -2.0750459302067976),
("integer (0..10)minute (grain)", -3.2848838539851317),
("hour", -2.982602982112198),
("integer (0..10)week (grain)", -3.410046996939138),
("month", -1.9437099281457109),
("<number>\20010/\20491hour (grain)", -4.508659285607248),
("integer (numeric)month (grain)", -3.2848838539851317),
("minute", -3.2848838539851317)],
n = 217}}),
-4.576770711466393),
("week", -2.967332799032293),
("integer (0..10)month (grain)", -2.720472721100767),
("integer (0..10)hour (grain)", -3.050714407971344),
("<number>\20010/\20491week (grain)", -3.788313351102123),
("second", -3.5471512942852352),
("integer (0..10)day (grain)", -3.050714407971344),
("integer (0..10)year (grain)", -3.7013019741124937),
("<number>\20010/\20491month (grain)", -3.4136199016607125),
("integer (numeric)year (grain)", -2.315007612992603),
("integer (0..10)second (grain)", -3.5471512942852352),
("day", -3.050714407971344), ("year", -2.1086711799947744),
("integer (0..10)minute (grain)", -3.050714407971344),
("hour", -3.050714407971344),
("integer (0..10)week (grain)", -3.4781584227982836),
("month", -1.9815160045095277),
("integer (numeric)month (grain)", -3.3529952798442775),
("integer with consecutive unit modifiersminute (grain)",
-4.24029847484518),
("minute", -2.81891279391402)],
n = 233}}),
("\32769\26495\33410",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.3862943611198906,
@ -821,56 +887,35 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("<time-of-day> am|pm",
Classifier{okData =
ClassData{prior = -0.4700036292457356, unseen = -2.70805020110221,
ClassData{prior = -0.5596157879354228, unseen = -3.044522437723423,
likelihoods =
HashMap.fromList
[("hh:mm (time-of-day)", -1.252762968495368),
("<integer> (latent time-of-day)", -1.540445040947149),
("hour", -1.540445040947149), ("minute", -1.252762968495368)],
n = 5},
[("hh:mm (time-of-day)", -1.0498221244986778),
("<integer> (latent time-of-day)", -1.8971199848858813),
("hour", -1.8971199848858813), ("minute", -1.0498221244986778)],
n = 8},
koData =
ClassData{prior = -0.9808292530117262,
unseen = -2.3978952727983707,
ClassData{prior = -0.8472978603872037, unseen = -2.833213344056216,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)", -0.916290731874155),
("hour", -0.916290731874155)],
n = 3}}),
("relative minutes after|past <integer> (hour-of-day)",
Classifier{okData =
ClassData{prior = -0.6931471805599453,
unseen = -3.2188758248682006,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)integer with consecutive unit modifiers",
-0.7801585575495751),
("hour", -0.7801585575495751)],
n = 10},
koData =
ClassData{prior = -0.6931471805599453,
unseen = -3.2188758248682006,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)number suffix: \21313|\25342",
-1.3862943611198906),
("<integer> (latent time-of-day)integer (0..10)",
-1.3862943611198906),
("hour", -0.7801585575495751)],
n = 10}}),
[("<integer> (latent time-of-day)", -0.8266785731844679),
("hour", -0.8266785731844679)],
n = 6}}),
("one point 2",
Classifier{okData =
ClassData{prior = -infinity, unseen = -1.3862943611198906,
ClassData{prior = -infinity, unseen = -1.6094379124341003,
likelihoods = HashMap.fromList [], n = 0},
koData =
ClassData{prior = 0.0, unseen = -2.772588722239781,
ClassData{prior = 0.0, unseen = -3.5553480614894135,
likelihoods =
HashMap.fromList
[("integer (0..10)integer (0..10)", -1.3217558399823195),
[("integer (0..10)integer (0..10)", -0.8873031950009028),
("integer (0..10)number suffix: \21313|\25342",
-1.3217558399823195),
-1.7346010553881064),
("integer (0..10)integer with consecutive unit modifiers",
-0.7621400520468967)],
n = 12}}),
-1.128465251817791),
("integer (0..10)<number>\20010/\20491", -2.4277482359480516)],
n = 30}}),
("intersect by \",\"",
Classifier{okData =
ClassData{prior = -0.40546510810816444,
@ -904,16 +949,20 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("integer with consecutive unit modifiers",
Classifier{okData =
ClassData{prior = 0.0, unseen = -3.367295829986474,
ClassData{prior = -5.715841383994864e-2,
unseen = -3.6109179126442243,
likelihoods =
HashMap.fromList
[("number suffix: \21313|\25342integer (0..10)",
-0.6931471805599453),
("integer (0..10)integer (0..10)", -0.6931471805599453)],
n = 26},
n = 34},
koData =
ClassData{prior = -infinity, unseen = -1.0986122886681098,
likelihoods = HashMap.fromList [], n = 0}}),
ClassData{prior = -2.890371757896165, unseen = -1.6094379124341003,
likelihoods =
HashMap.fromList
[("integer (0..10)integer (0..10)", -0.2876820724517809)],
n = 2}}),
("second (grain)",
Classifier{okData =
ClassData{prior = 0.0, unseen = -2.70805020110221,
@ -977,8 +1026,8 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("March",
Classifier{okData =
ClassData{prior = 0.0, unseen = -2.772588722239781,
likelihoods = HashMap.fromList [("", 0.0)], n = 14},
ClassData{prior = 0.0, unseen = -2.833213344056216,
likelihoods = HashMap.fromList [("", 0.0)], n = 15},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
@ -991,11 +1040,12 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("the day after tomorrow",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.6094379124341003,
ClassData{prior = -0.5108256237659907,
unseen = -1.6094379124341003,
likelihoods = HashMap.fromList [("", 0.0)], n = 3},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
ClassData{prior = -0.916290731874155, unseen = -1.3862943611198906,
likelihoods = HashMap.fromList [("", 0.0)], n = 2}}),
("\22307\21608\20845",
Classifier{okData =
ClassData{prior = -0.6931471805599453,
@ -1076,27 +1126,25 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("next n <cycle>",
Classifier{okData =
ClassData{prior = 0.0, unseen = -4.61512051684126,
ClassData{prior = 0.0, unseen = -4.605170185988091,
likelihoods =
HashMap.fromList
[("week", -2.4079456086518722),
("integer (0..10)hour (grain)", -2.659260036932778),
("<number>\20010/\20491week (grain)", -2.995732273553991),
("second", -2.8134107167600364),
("integer (0..10)day (grain)", -2.5257286443082556),
("integer (0..10)year (grain)", -3.2188758248682006),
("<number>\20010/\20491month (grain)", -2.8134107167600364),
("integer (0..10)second (grain)", -2.8134107167600364),
("day", -2.5257286443082556), ("year", -3.2188758248682006),
("integer (0..10)minute (grain)", -2.659260036932778),
("hour", -2.4079456086518722),
("integer (0..10)week (grain)", -2.995732273553991),
("month", -2.8134107167600364),
("<number>\20010/\20491hour (grain)", -3.506557897319982),
("minute", -2.659260036932778)],
[("week", -2.3978952727983707),
("integer (0..10)hour (grain)", -2.3978952727983707),
("<number>\20010/\20491week (grain)", -2.9856819377004897),
("second", -2.803360380906535),
("integer (0..10)day (grain)", -2.515678308454754),
("integer (0..10)year (grain)", -3.2088254890146994),
("<number>\20010/\20491month (grain)", -2.803360380906535),
("integer (0..10)second (grain)", -2.803360380906535),
("day", -2.515678308454754), ("year", -3.2088254890146994),
("integer (0..10)minute (grain)", -2.649209701079277),
("hour", -2.3978952727983707),
("integer (0..10)week (grain)", -2.9856819377004897),
("month", -2.803360380906535), ("minute", -2.649209701079277)],
n = 42},
koData =
ClassData{prior = -infinity, unseen = -2.833213344056216,
ClassData{prior = -infinity, unseen = -2.772588722239781,
likelihoods = HashMap.fromList [], n = 0}}),
("\19975\22307\33410",
Classifier{okData =
@ -1112,6 +1160,14 @@ classifiers
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
("number of five minutes",
Classifier{okData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0},
koData =
ClassData{prior = 0.0, unseen = -1.3862943611198906,
likelihoods = HashMap.fromList [("integer (0..10)", 0.0)],
n = 2}}),
("\20799\31461\33410",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.9459101490553135,
@ -1134,6 +1190,18 @@ classifiers
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
("number.number minutes",
Classifier{okData =
ClassData{prior = -infinity, unseen = -1.0986122886681098,
likelihoods = HashMap.fromList [], n = 0},
koData =
ClassData{prior = 0.0, unseen = -2.3978952727983707,
likelihoods =
HashMap.fromList
[("integer (0..10)integer with consecutive unit modifiersminute (grain)",
-0.6931471805599453),
("minute", -0.6931471805599453)],
n = 4}}),
("\32822\31267\21463\38590\26085",
Classifier{okData =
ClassData{prior = -1.0296194171811581,
@ -1145,19 +1213,19 @@ classifiers
likelihoods = HashMap.fromList [("", 0.0)], n = 9}}),
("<named-month> <day-of-month>",
Classifier{okData =
ClassData{prior = 0.0, unseen = -4.709530201312334,
ClassData{prior = 0.0, unseen = -4.762173934797756,
likelihoods =
HashMap.fromList
[("Marchinteger (0..10)", -2.6210388241125804),
("Marchinteger (numeric)", -3.0910424533583156),
("Aprilinteger (numeric)", -3.6018680771243066),
("Februaryinteger (0..10)", -2.6210388241125804),
("Februarynumber suffix: \21313|\25342", -2.6210388241125804),
("month", -0.7492366472109889),
("Februaryinteger (numeric)", -2.503255788456197),
[("Marchinteger (0..10)", -2.5563656137701454),
("Marchinteger (numeric)", -3.144152278672264),
("Aprilinteger (numeric)", -3.654977902438255),
("Februaryinteger (0..10)", -2.6741486494265287),
("Februarynumber suffix: \21313|\25342", -2.6741486494265287),
("month", -0.7462570058738938),
("Februaryinteger (numeric)", -2.5563656137701454),
("Februaryinteger with consecutive unit modifiers",
-1.8672670217362002)],
n = 51},
-1.8091512119399242)],
n = 54},
koData =
ClassData{prior = -infinity, unseen = -2.1972245773362196,
likelihoods = HashMap.fromList [], n = 0}}),
@ -1191,14 +1259,21 @@ classifiers
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
("two days after tomorrow",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.3862943611198906,
likelihoods = HashMap.fromList [("", 0.0)], n = 2},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
("integer (0..10)",
Classifier{okData =
ClassData{prior = -0.7055697005585025,
unseen = -5.0875963352323845,
likelihoods = HashMap.fromList [("", 0.0)], n = 160},
ClassData{prior = -0.6026331730191135,
unseen = -5.3471075307174685,
likelihoods = HashMap.fromList [("", 0.0)], n = 208},
koData =
ClassData{prior = -0.680877087968131, unseen = -5.111987788356543,
likelihoods = HashMap.fromList [("", 0.0)], n = 164}}),
ClassData{prior = -0.7926767759069784, unseen = -5.159055299214529,
likelihoods = HashMap.fromList [("", 0.0)], n = 172}}),
("last n <cycle>",
Classifier{okData =
ClassData{prior = 0.0, unseen = -4.605170185988091,
@ -1236,27 +1311,25 @@ classifiers
n = 10}}),
("n <cycle> last",
Classifier{okData =
ClassData{prior = 0.0, unseen = -4.04305126783455,
ClassData{prior = 0.0, unseen = -4.02535169073515,
likelihoods =
HashMap.fromList
[("week", -2.4159137783010487),
("integer (0..10)hour (grain)", -2.9267394020670396),
("<number>\20010/\20491week (grain)", -2.9267394020670396),
("second", -2.9267394020670396),
("integer (0..10)day (grain)", -2.4159137783010487),
("integer (0..10)year (grain)", -2.9267394020670396),
("<number>\20010/\20491month (grain)", -2.9267394020670396),
("integer (0..10)second (grain)", -2.9267394020670396),
("day", -2.4159137783010487), ("year", -2.9267394020670396),
("integer (0..10)minute (grain)", -2.9267394020670396),
("hour", -2.4159137783010487),
("integer (0..10)week (grain)", -2.9267394020670396),
("month", -2.9267394020670396),
("<number>\20010/\20491hour (grain)", -2.9267394020670396),
("minute", -2.9267394020670396)],
[("week", -2.3978952727983707),
("integer (0..10)hour (grain)", -2.3978952727983707),
("<number>\20010/\20491week (grain)", -2.908720896564361),
("second", -2.908720896564361),
("integer (0..10)day (grain)", -2.3978952727983707),
("integer (0..10)year (grain)", -2.908720896564361),
("<number>\20010/\20491month (grain)", -2.908720896564361),
("integer (0..10)second (grain)", -2.908720896564361),
("day", -2.3978952727983707), ("year", -2.908720896564361),
("integer (0..10)minute (grain)", -2.908720896564361),
("hour", -2.3978952727983707),
("integer (0..10)week (grain)", -2.908720896564361),
("month", -2.908720896564361), ("minute", -2.908720896564361)],
n = 20},
koData =
ClassData{prior = -infinity, unseen = -2.833213344056216,
ClassData{prior = -infinity, unseen = -2.772588722239781,
likelihoods = HashMap.fromList [], n = 0}}),
("\24527\24724\33410",
Classifier{okData =
@ -1281,11 +1354,11 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("number suffix: \21313|\25342",
Classifier{okData =
ClassData{prior = -0.2231435513142097,
unseen = -3.0910424533583156,
likelihoods = HashMap.fromList [("", 0.0)], n = 20},
ClassData{prior = -0.18924199963852842,
unseen = -3.258096538021482,
likelihoods = HashMap.fromList [("", 0.0)], n = 24},
koData =
ClassData{prior = -1.6094379124341003,
ClassData{prior = -1.7578579175523736,
unseen = -1.9459101490553135,
likelihoods = HashMap.fromList [("", 0.0)], n = 5}}),
("\22320\29699\19968\23567\26102",
@ -1322,11 +1395,19 @@ classifiers
likelihoods = HashMap.fromList [("", 0.0)], n = 6}}),
("<number>\20010/\20491",
Classifier{okData =
ClassData{prior = 0.0, unseen = -3.4339872044851463,
likelihoods = HashMap.fromList [("integer (0..10)", 0.0)], n = 29},
ClassData{prior = -0.2006706954621511,
unseen = -3.4011973816621555,
likelihoods =
HashMap.fromList [("integer (0..10)", -3.509131981127006e-2)],
n = 27},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
ClassData{prior = -1.7047480922384253,
unseen = -2.1972245773362196,
likelihoods =
HashMap.fromList
[("one point 2", -0.9808292530117262),
("integer (0..10)", -0.4700036292457356)],
n = 6}}),
("\24773\20154\33410",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.9459101490553135,

View File

@ -35,6 +35,20 @@ classifiers
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
("number of 5 minutes after|past <integer> (hour-of-day)",
Classifier{okData =
ClassData{prior = 0.0, unseen = -3.332204510175204,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)integer (0..10)",
-0.8979415932059586),
("hour", -0.7308875085427924),
("<integer> (latent time-of-day)<number>\20010/\20491",
-2.1972245773362196)],
n = 12},
koData =
ClassData{prior = -infinity, unseen = -1.3862943611198906,
likelihoods = HashMap.fromList [], n = 0}}),
("\21360\24230\20016\25910\33410\31532\22235\22825",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.6094379124341003,
@ -64,11 +78,11 @@ classifiers
likelihoods = HashMap.fromList [("", 0.0)], n = 3}}),
("integer (numeric)",
Classifier{okData =
ClassData{prior = -0.535142931416697, unseen = -4.204692619390966,
ClassData{prior = -0.621403275701104, unseen = -4.204692619390966,
likelihoods = HashMap.fromList [("", 0.0)], n = 65},
koData =
ClassData{prior = -0.8808888048232392, unseen = -3.871201010907891,
likelihoods = HashMap.fromList [("", 0.0)], n = 46}}),
ClassData{prior = -0.7704388548615918, unseen = -4.060443010546419,
likelihoods = HashMap.fromList [("", 0.0)], n = 56}}),
("\21355\22622\33410",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.9459101490553135,
@ -145,29 +159,29 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("month (grain)",
Classifier{okData =
ClassData{prior = -1.0541605260972757,
ClassData{prior = -1.0840134892469568,
unseen = -3.2188758248682006,
likelihoods = HashMap.fromList [("", 0.0)], n = 23},
koData =
ClassData{prior = -0.42845462633286313,
unseen = -3.8066624897703196,
likelihoods = HashMap.fromList [("", 0.0)], n = 43}}),
ClassData{prior = -0.41284521540578695,
unseen = -3.8501476017100584,
likelihoods = HashMap.fromList [("", 0.0)], n = 45}}),
("<time-of-day> o'clock",
Classifier{okData =
ClassData{prior = -0.4418327522790392, unseen = -3.044522437723423,
ClassData{prior = -1.2367626271489267, unseen = -3.044522437723423,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)", -0.6931471805599453),
("hour", -0.6931471805599453)],
n = 9},
koData =
ClassData{prior = -1.0296194171811581,
unseen = -2.5649493574615367,
ClassData{prior = -0.3429447511268303,
unseen = -3.8501476017100584,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)", -0.6931471805599453),
("hour", -0.6931471805599453)],
n = 5}}),
n = 22}}),
("national day",
Classifier{okData =
ClassData{prior = -0.2231435513142097,
@ -225,71 +239,73 @@ classifiers
likelihoods = HashMap.fromList [("", 0.0)], n = 2}}),
("intersect",
Classifier{okData =
ClassData{prior = -0.39204208777602373,
unseen = -5.198497031265826,
ClassData{prior = -0.3968813644167729, unseen = -5.247024072160486,
likelihoods =
HashMap.fromList
[("\20799\31461\33410<part-of-day> <dim time>",
-3.58351893845611),
-3.632309102625542),
("year (numeric with year symbol)\20809\26126\33410",
-3.1135153092103742),
-3.1623054733798064),
("xxxx year<named-month> <day-of-month>", -3.855452653939752),
("year (numeric with year symbol)\25995\26376",
-3.8066624897703196),
-3.855452653939752),
("year (numeric with year symbol)\20061\22812\33410",
-3.8066624897703196),
-3.855452653939752),
("year (numeric with year symbol)<named-month> <day-of-month>",
-2.3597435068339943),
-2.4085336710034264),
("year (numeric with year symbol)\22320\29699\19968\23567\26102",
-4.0943445622221),
("dayday", -2.4849066497880004),
("hourhour", -3.58351893845611),
("hourminute", -3.58351893845611),
-4.143134726391533),
("dayday", -2.5336968139574325),
("hourhour", -3.632309102625542),
("hourminute", -3.632309102625542),
("absorption of , after named day<named-month> <day-of-month>",
-2.4849066497880004),
-2.5336968139574325),
("year (numeric with year symbol)\22823\25995\26399",
-3.8066624897703196),
-3.855452653939752),
("year (numeric with year symbol)\22235\26092\33410",
-4.0943445622221),
-4.143134726391533),
("year (numeric with year symbol)\20303\26842\33410",
-4.0943445622221),
("dayminute", -3.58351893845611),
("tonight<time-of-day> o'clock", -3.58351893845611),
("<dim time> <part-of-day>relative minutes after|past <integer> (hour-of-day)",
-3.58351893845611),
("yearday", -1.3217558399823195),
-4.143134726391533),
("dayminute", -3.632309102625542),
("tonight<time-of-day> o'clock", -3.632309102625542),
("yearday", -1.3099213823353166),
("year (numeric with year symbol)\19971\19971\33410",
-3.1135153092103742),
-3.1623054733798064),
("year (numeric with year symbol)\36926\36234\33410",
-4.0943445622221),
-4.143134726391533),
("year (numeric with year symbol)\29369\22826\26032\24180",
-4.0943445622221),
("yearminute", -4.0943445622221)],
n = 75},
-4.143134726391533),
("yearminute", -4.143134726391533),
("<dim time> <part-of-day>relative (10-59) minutes after|past <integer> (hour-of-day)",
-3.632309102625542)],
n = 78},
koData =
ClassData{prior = -1.126011262856224, unseen = -4.634728988229636,
ClassData{prior = -1.1160040313799788, unseen = -4.700480365792417,
likelihoods =
HashMap.fromList
[("\20799\31461\33410<part-of-day> <dim time>",
-2.4277482359480516),
("dayhour", -3.0155349008501706),
("daymonth", -2.5455312716044354),
-2.4941233048929243),
("dayhour", -3.0819099697950434),
("daymonth", -2.6119063405493077),
("year (numeric with year symbol)February",
-3.0155349008501706),
("year (numeric with year symbol)Sunday", -3.9318256327243257),
-3.0819099697950434),
("year (numeric with year symbol)Sunday", -3.9982007016691985),
("<dim time> <part-of-day><time-of-day> o'clock",
-3.5263605246161616),
("year (numeric with year symbol)April", -3.5263605246161616),
("hourhour", -3.5263605246161616),
("year (numeric with year symbol)March", -2.4277482359480516),
("hourminute", -3.0155349008501706),
("yearmonth", -1.916922612182061),
("dayminute", -3.0155349008501706),
("<dim time> <part-of-day>relative minutes after|past <integer> (hour-of-day)",
-3.0155349008501706),
("yearday", -3.9318256327243257),
-3.592735593561034),
("year (numeric with year symbol)April", -3.592735593561034),
("hourhour", -3.592735593561034),
("xxxx yearFebruary", -3.9982007016691985),
("year (numeric with year symbol)March", -2.4941233048929243),
("hourminute", -3.0819099697950434),
("yearmonth", -1.8581345381729275),
("dayminute", -3.0819099697950434),
("xxxx yearMarch", -3.9982007016691985),
("yearday", -3.9982007016691985),
("absorption of , after named dayFebruary",
-2.5455312716044354)],
n = 36}}),
-2.6119063405493077),
("<dim time> <part-of-day>relative (10-59) minutes after|past <integer> (hour-of-day)",
-3.0819099697950434)],
n = 38}}),
("\20399\20029\33410",
Classifier{okData =
ClassData{prior = 0.0, unseen = -2.3978952727983707,
@ -299,12 +315,13 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("year (grain)",
Classifier{okData =
ClassData{prior = -1.6625477377480489,
ClassData{prior = -1.6964492894237302,
unseen = -2.5649493574615367,
likelihoods = HashMap.fromList [("", 0.0)], n = 11},
koData =
ClassData{prior = -0.2102954088363608, unseen = -3.891820298110627,
likelihoods = HashMap.fromList [("", 0.0)], n = 47}}),
ClassData{prior = -0.2025242641114741,
unseen = -3.9318256327243257,
likelihoods = HashMap.fromList [("", 0.0)], n = 49}}),
("Saturday",
Classifier{okData =
ClassData{prior = -0.8754687373538999,
@ -460,26 +477,39 @@ classifiers
likelihoods = HashMap.fromList [("", 0.0)], n = 3}}),
("hh:mm (time-of-day)",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.9459101490553135,
likelihoods = HashMap.fromList [("", 0.0)], n = 5},
ClassData{prior = 0.0, unseen = -2.4849066497880004,
likelihoods = HashMap.fromList [("", 0.0)], n = 10},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
("<integer> (latent time-of-day)",
("relative (1-9) minutes after|past <integer> (hour-of-day)",
Classifier{okData =
ClassData{prior = -0.2231435513142097,
unseen = -2.9444389791664407,
ClassData{prior = 0.0, unseen = -3.044522437723423,
likelihoods =
HashMap.fromList
[("integer (numeric)", -1.2809338454620642),
("integer (0..10)", -0.325422400434628)],
n = 16},
[("<integer> (latent time-of-day)integer (0..10)",
-0.6931471805599453),
("hour", -0.6931471805599453)],
n = 9},
koData =
ClassData{prior = -1.6094379124341003,
unseen = -1.9459101490553135,
ClassData{prior = -infinity, unseen = -1.0986122886681098,
likelihoods = HashMap.fromList [], n = 0}}),
("<integer> (latent time-of-day)",
Classifier{okData =
ClassData{prior = -0.3101549283038396,
unseen = -3.6109179126442243,
likelihoods =
HashMap.fromList [("integer (numeric)", -0.1823215567939546)],
n = 4}}),
HashMap.fromList
[("integer (numeric)", -1.9740810260220096),
("integer (0..10)", -0.1823215567939546)],
n = 33},
koData =
ClassData{prior = -1.3217558399823195, unseen = -2.772588722239781,
likelihoods =
HashMap.fromList
[("integer (numeric)", -0.5108256237659907),
("one point 2", -1.0986122886681098)],
n = 12}}),
("\36926\36234\33410",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.3862943611198906,
@ -543,6 +573,26 @@ classifiers
ClassData{prior = -0.5625269981428811,
unseen = -3.9318256327243257,
likelihoods = HashMap.fromList [("", 0.0)], n = 49}}),
("relative (10-59) minutes after|past <integer> (hour-of-day)",
Classifier{okData =
ClassData{prior = -0.5465437063680699, unseen = -3.891820298110627,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)integer with consecutive unit modifiers",
-0.7357067949787413),
("hour", -0.7357067949787413)],
n = 22},
koData =
ClassData{prior = -0.8649974374866046,
unseen = -3.6109179126442243,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)number suffix: \21313|\25342",
-1.3862943611198906),
("<integer> (latent time-of-day)integer (0..10)",
-1.3862943611198906),
("hour", -0.750305594399894)],
n = 16}}),
("year (numeric with year symbol)",
Classifier{okData =
ClassData{prior = 0.0, unseen = -3.891820298110627,
@ -673,8 +723,8 @@ classifiers
likelihoods = HashMap.fromList [("", 0.0)], n = 1}}),
("afternoon",
Classifier{okData =
ClassData{prior = 0.0, unseen = -2.3978952727983707,
likelihoods = HashMap.fromList [("", 0.0)], n = 9},
ClassData{prior = 0.0, unseen = -3.367295829986474,
likelihoods = HashMap.fromList [("", 0.0)], n = 27},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
@ -701,8 +751,8 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("February",
Classifier{okData =
ClassData{prior = 0.0, unseen = -3.2188758248682006,
likelihoods = HashMap.fromList [("", 0.0)], n = 23},
ClassData{prior = 0.0, unseen = -3.258096538021482,
likelihoods = HashMap.fromList [("", 0.0)], n = 24},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
@ -727,8 +777,20 @@ classifiers
n = 23}}),
("minute (grain)",
Classifier{okData =
ClassData{prior = 0.0, unseen = -2.890371757896165,
ClassData{prior = -0.3184537311185346, unseen = -2.890371757896165,
likelihoods = HashMap.fromList [("", 0.0)], n = 16},
koData =
ClassData{prior = -1.2992829841302609,
unseen = -2.0794415416798357,
likelihoods = HashMap.fromList [("", 0.0)], n = 6}}),
("xxxx year",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.3862943611198906,
likelihoods =
HashMap.fromList
[("integer (0..10)integer (0..10)integer (0..10)integer (0..10)",
0.0)],
n = 2},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
@ -749,62 +811,66 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("<part-of-day> <dim time>",
Classifier{okData =
ClassData{prior = -0.6097655716208943, unseen = -4.07753744390572,
ClassData{prior = -0.7507762933965817, unseen = -4.859812404361672,
likelihoods =
HashMap.fromList
[("tonight<integer> (latent time-of-day)", -2.451005098112319),
("hourhour", -1.3523928094442093),
("afternoonrelative minutes after|past <integer> (hour-of-day)",
-1.6625477377480489),
("afternoon<time-of-day> o'clock", -2.6741486494265287),
("hourminute", -1.575536360758419),
[("tonight<integer> (latent time-of-day)", -3.242592351485517),
("afternoonrelative (10-59) minutes after|past <integer> (hour-of-day)",
-1.7165360479904674),
("hourhour", -2.1439800628174073),
("afternoon<time-of-day> o'clock", -3.4657359027997265),
("hourminute", -1.0233888674305223),
("afternoon<integer> (latent time-of-day)",
-2.6741486494265287),
("afternoonhh:mm (time-of-day)", -3.367295829986474),
("tonight<time-of-day> o'clock", -2.451005098112319)],
n = 25},
-3.4657359027997265),
("afternoonrelative (1-9) minutes after|past <integer> (hour-of-day)",
-2.5494451709255714),
("afternoonhh:mm (time-of-day)", -3.7534179752515073),
("tonight<time-of-day> o'clock", -3.242592351485517),
("afternoonnumber of 5 minutes after|past <integer> (hour-of-day)",
-2.2870809064580806)],
n = 59},
koData =
ClassData{prior = -0.7841189587656721,
unseen = -3.9318256327243257,
ClassData{prior = -0.6386589952758756, unseen = -4.962844630259907,
likelihoods =
HashMap.fromList
[("hourhour", -1.4271163556401458),
("afternoonrelative minutes after|past <integer> (hour-of-day)",
-1.5141277326297755),
("afternoon<time-of-day> o'clock", -2.120263536200091),
("hourminute", -1.5141277326297755),
[("afternoonrelative (10-59) minutes after|past <integer> (hour-of-day)",
-2.1226137135450447),
("hourhour", -1.024001424876935),
("afternoon<time-of-day> o'clock", -1.820332841672111),
("hourminute", -2.1226137135450447),
("afternoon<integer> (latent time-of-day)",
-1.9661128563728327)],
n = 21}}),
-1.5885312276147867)],
n = 66}}),
("<integer> <unit-of-duration>",
Classifier{okData =
ClassData{prior = -infinity, unseen = -3.044522437723423,
likelihoods = HashMap.fromList [], n = 0},
koData =
ClassData{prior = 0.0, unseen = -6.12029741895095,
ClassData{prior = 0.0, unseen = -6.18826412308259,
likelihoods =
HashMap.fromList
[("number suffix: \21313|\25342month (grain)",
-4.508659285607248),
("week", -2.8992213731731473),
("integer (0..10)month (grain)", -2.7168998163791924),
("integer (0..10)hour (grain)", -3.1736582188749076),
("<number>\20010/\20491week (grain)", -3.720201925242977),
("second", -3.4790398684260895),
("integer (0..10)day (grain)", -2.982602982112198),
("integer (0..10)year (grain)", -3.8155121050473024),
("<number>\20010/\20491month (grain)", -3.3455084758015667),
("integer (numeric)year (grain)", -2.246896187133457),
("integer (0..10)second (grain)", -3.4790398684260895),
("day", -2.982602982112198), ("year", -2.0750459302067976),
("integer (0..10)minute (grain)", -3.2848838539851317),
("hour", -2.982602982112198),
("integer (0..10)week (grain)", -3.410046996939138),
("month", -1.9437099281457109),
("<number>\20010/\20491hour (grain)", -4.508659285607248),
("integer (numeric)month (grain)", -3.2848838539851317),
("minute", -3.2848838539851317)],
n = 217}}),
-4.576770711466393),
("week", -2.967332799032293),
("integer (0..10)month (grain)", -2.720472721100767),
("integer (0..10)hour (grain)", -3.050714407971344),
("<number>\20010/\20491week (grain)", -3.788313351102123),
("second", -3.5471512942852352),
("integer (0..10)day (grain)", -3.050714407971344),
("integer (0..10)year (grain)", -3.7013019741124937),
("<number>\20010/\20491month (grain)", -3.4136199016607125),
("integer (numeric)year (grain)", -2.315007612992603),
("integer (0..10)second (grain)", -3.5471512942852352),
("day", -3.050714407971344), ("year", -2.1086711799947744),
("integer (0..10)minute (grain)", -3.050714407971344),
("hour", -3.050714407971344),
("integer (0..10)week (grain)", -3.4781584227982836),
("month", -1.9815160045095277),
("integer (numeric)month (grain)", -3.3529952798442775),
("integer with consecutive unit modifiersminute (grain)",
-4.24029847484518),
("minute", -2.81891279391402)],
n = 233}}),
("\32769\26495\33410",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.3862943611198906,
@ -821,56 +887,35 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("<time-of-day> am|pm",
Classifier{okData =
ClassData{prior = -0.4700036292457356, unseen = -2.70805020110221,
ClassData{prior = -0.5596157879354228, unseen = -3.044522437723423,
likelihoods =
HashMap.fromList
[("hh:mm (time-of-day)", -1.252762968495368),
("<integer> (latent time-of-day)", -1.540445040947149),
("hour", -1.540445040947149), ("minute", -1.252762968495368)],
n = 5},
[("hh:mm (time-of-day)", -1.0498221244986778),
("<integer> (latent time-of-day)", -1.8971199848858813),
("hour", -1.8971199848858813), ("minute", -1.0498221244986778)],
n = 8},
koData =
ClassData{prior = -0.9808292530117262,
unseen = -2.3978952727983707,
ClassData{prior = -0.8472978603872037, unseen = -2.833213344056216,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)", -0.916290731874155),
("hour", -0.916290731874155)],
n = 3}}),
("relative minutes after|past <integer> (hour-of-day)",
Classifier{okData =
ClassData{prior = -0.6931471805599453,
unseen = -3.2188758248682006,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)integer with consecutive unit modifiers",
-0.7801585575495751),
("hour", -0.7801585575495751)],
n = 10},
koData =
ClassData{prior = -0.6931471805599453,
unseen = -3.2188758248682006,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)number suffix: \21313|\25342",
-1.3862943611198906),
("<integer> (latent time-of-day)integer (0..10)",
-1.3862943611198906),
("hour", -0.7801585575495751)],
n = 10}}),
[("<integer> (latent time-of-day)", -0.8266785731844679),
("hour", -0.8266785731844679)],
n = 6}}),
("one point 2",
Classifier{okData =
ClassData{prior = -infinity, unseen = -1.3862943611198906,
ClassData{prior = -infinity, unseen = -1.6094379124341003,
likelihoods = HashMap.fromList [], n = 0},
koData =
ClassData{prior = 0.0, unseen = -2.772588722239781,
ClassData{prior = 0.0, unseen = -3.5553480614894135,
likelihoods =
HashMap.fromList
[("integer (0..10)integer (0..10)", -1.3217558399823195),
[("integer (0..10)integer (0..10)", -0.8873031950009028),
("integer (0..10)number suffix: \21313|\25342",
-1.3217558399823195),
-1.7346010553881064),
("integer (0..10)integer with consecutive unit modifiers",
-0.7621400520468967)],
n = 12}}),
-1.128465251817791),
("integer (0..10)<number>\20010/\20491", -2.4277482359480516)],
n = 30}}),
("intersect by \",\"",
Classifier{okData =
ClassData{prior = -0.40546510810816444,
@ -904,16 +949,20 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("integer with consecutive unit modifiers",
Classifier{okData =
ClassData{prior = 0.0, unseen = -3.367295829986474,
ClassData{prior = -5.715841383994864e-2,
unseen = -3.6109179126442243,
likelihoods =
HashMap.fromList
[("number suffix: \21313|\25342integer (0..10)",
-0.6931471805599453),
("integer (0..10)integer (0..10)", -0.6931471805599453)],
n = 26},
n = 34},
koData =
ClassData{prior = -infinity, unseen = -1.0986122886681098,
likelihoods = HashMap.fromList [], n = 0}}),
ClassData{prior = -2.890371757896165, unseen = -1.6094379124341003,
likelihoods =
HashMap.fromList
[("integer (0..10)integer (0..10)", -0.2876820724517809)],
n = 2}}),
("second (grain)",
Classifier{okData =
ClassData{prior = 0.0, unseen = -2.70805020110221,
@ -977,8 +1026,8 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("March",
Classifier{okData =
ClassData{prior = 0.0, unseen = -2.772588722239781,
likelihoods = HashMap.fromList [("", 0.0)], n = 14},
ClassData{prior = 0.0, unseen = -2.833213344056216,
likelihoods = HashMap.fromList [("", 0.0)], n = 15},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
@ -991,11 +1040,12 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("the day after tomorrow",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.6094379124341003,
ClassData{prior = -0.5108256237659907,
unseen = -1.6094379124341003,
likelihoods = HashMap.fromList [("", 0.0)], n = 3},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
ClassData{prior = -0.916290731874155, unseen = -1.3862943611198906,
likelihoods = HashMap.fromList [("", 0.0)], n = 2}}),
("\22307\21608\20845",
Classifier{okData =
ClassData{prior = -0.6931471805599453,
@ -1076,27 +1126,25 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("next n <cycle>",
Classifier{okData =
ClassData{prior = 0.0, unseen = -4.61512051684126,
ClassData{prior = 0.0, unseen = -4.605170185988091,
likelihoods =
HashMap.fromList
[("week", -2.4079456086518722),
("integer (0..10)hour (grain)", -2.659260036932778),
("<number>\20010/\20491week (grain)", -2.995732273553991),
("second", -2.8134107167600364),
("integer (0..10)day (grain)", -2.5257286443082556),
("integer (0..10)year (grain)", -3.2188758248682006),
("<number>\20010/\20491month (grain)", -2.8134107167600364),
("integer (0..10)second (grain)", -2.8134107167600364),
("day", -2.5257286443082556), ("year", -3.2188758248682006),
("integer (0..10)minute (grain)", -2.659260036932778),
("hour", -2.4079456086518722),
("integer (0..10)week (grain)", -2.995732273553991),
("month", -2.8134107167600364),
("<number>\20010/\20491hour (grain)", -3.506557897319982),
("minute", -2.659260036932778)],
[("week", -2.3978952727983707),
("integer (0..10)hour (grain)", -2.3978952727983707),
("<number>\20010/\20491week (grain)", -2.9856819377004897),
("second", -2.803360380906535),
("integer (0..10)day (grain)", -2.515678308454754),
("integer (0..10)year (grain)", -3.2088254890146994),
("<number>\20010/\20491month (grain)", -2.803360380906535),
("integer (0..10)second (grain)", -2.803360380906535),
("day", -2.515678308454754), ("year", -3.2088254890146994),
("integer (0..10)minute (grain)", -2.649209701079277),
("hour", -2.3978952727983707),
("integer (0..10)week (grain)", -2.9856819377004897),
("month", -2.803360380906535), ("minute", -2.649209701079277)],
n = 42},
koData =
ClassData{prior = -infinity, unseen = -2.833213344056216,
ClassData{prior = -infinity, unseen = -2.772588722239781,
likelihoods = HashMap.fromList [], n = 0}}),
("\19975\22307\33410",
Classifier{okData =
@ -1112,6 +1160,14 @@ classifiers
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
("number of five minutes",
Classifier{okData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0},
koData =
ClassData{prior = 0.0, unseen = -1.3862943611198906,
likelihoods = HashMap.fromList [("integer (0..10)", 0.0)],
n = 2}}),
("\20799\31461\33410",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.9459101490553135,
@ -1134,6 +1190,18 @@ classifiers
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
("number.number minutes",
Classifier{okData =
ClassData{prior = -infinity, unseen = -1.0986122886681098,
likelihoods = HashMap.fromList [], n = 0},
koData =
ClassData{prior = 0.0, unseen = -2.3978952727983707,
likelihoods =
HashMap.fromList
[("integer (0..10)integer with consecutive unit modifiersminute (grain)",
-0.6931471805599453),
("minute", -0.6931471805599453)],
n = 4}}),
("\32822\31267\21463\38590\26085",
Classifier{okData =
ClassData{prior = -1.0296194171811581,
@ -1145,19 +1213,19 @@ classifiers
likelihoods = HashMap.fromList [("", 0.0)], n = 9}}),
("<named-month> <day-of-month>",
Classifier{okData =
ClassData{prior = 0.0, unseen = -4.709530201312334,
ClassData{prior = 0.0, unseen = -4.762173934797756,
likelihoods =
HashMap.fromList
[("Marchinteger (0..10)", -2.6210388241125804),
("Marchinteger (numeric)", -3.0910424533583156),
("Aprilinteger (numeric)", -3.6018680771243066),
("Februaryinteger (0..10)", -2.6210388241125804),
("Februarynumber suffix: \21313|\25342", -2.6210388241125804),
("month", -0.7492366472109889),
("Februaryinteger (numeric)", -2.503255788456197),
[("Marchinteger (0..10)", -2.5563656137701454),
("Marchinteger (numeric)", -3.144152278672264),
("Aprilinteger (numeric)", -3.654977902438255),
("Februaryinteger (0..10)", -2.6741486494265287),
("Februarynumber suffix: \21313|\25342", -2.6741486494265287),
("month", -0.7462570058738938),
("Februaryinteger (numeric)", -2.5563656137701454),
("Februaryinteger with consecutive unit modifiers",
-1.8672670217362002)],
n = 51},
-1.8091512119399242)],
n = 54},
koData =
ClassData{prior = -infinity, unseen = -2.1972245773362196,
likelihoods = HashMap.fromList [], n = 0}}),
@ -1191,14 +1259,21 @@ classifiers
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
("two days after tomorrow",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.3862943611198906,
likelihoods = HashMap.fromList [("", 0.0)], n = 2},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
("integer (0..10)",
Classifier{okData =
ClassData{prior = -0.7055697005585025,
unseen = -5.0875963352323845,
likelihoods = HashMap.fromList [("", 0.0)], n = 160},
ClassData{prior = -0.6026331730191135,
unseen = -5.3471075307174685,
likelihoods = HashMap.fromList [("", 0.0)], n = 208},
koData =
ClassData{prior = -0.680877087968131, unseen = -5.111987788356543,
likelihoods = HashMap.fromList [("", 0.0)], n = 164}}),
ClassData{prior = -0.7926767759069784, unseen = -5.159055299214529,
likelihoods = HashMap.fromList [("", 0.0)], n = 172}}),
("last n <cycle>",
Classifier{okData =
ClassData{prior = 0.0, unseen = -4.605170185988091,
@ -1236,27 +1311,25 @@ classifiers
n = 10}}),
("n <cycle> last",
Classifier{okData =
ClassData{prior = 0.0, unseen = -4.04305126783455,
ClassData{prior = 0.0, unseen = -4.02535169073515,
likelihoods =
HashMap.fromList
[("week", -2.4159137783010487),
("integer (0..10)hour (grain)", -2.9267394020670396),
("<number>\20010/\20491week (grain)", -2.9267394020670396),
("second", -2.9267394020670396),
("integer (0..10)day (grain)", -2.4159137783010487),
("integer (0..10)year (grain)", -2.9267394020670396),
("<number>\20010/\20491month (grain)", -2.9267394020670396),
("integer (0..10)second (grain)", -2.9267394020670396),
("day", -2.4159137783010487), ("year", -2.9267394020670396),
("integer (0..10)minute (grain)", -2.9267394020670396),
("hour", -2.4159137783010487),
("integer (0..10)week (grain)", -2.9267394020670396),
("month", -2.9267394020670396),
("<number>\20010/\20491hour (grain)", -2.9267394020670396),
("minute", -2.9267394020670396)],
[("week", -2.3978952727983707),
("integer (0..10)hour (grain)", -2.3978952727983707),
("<number>\20010/\20491week (grain)", -2.908720896564361),
("second", -2.908720896564361),
("integer (0..10)day (grain)", -2.3978952727983707),
("integer (0..10)year (grain)", -2.908720896564361),
("<number>\20010/\20491month (grain)", -2.908720896564361),
("integer (0..10)second (grain)", -2.908720896564361),
("day", -2.3978952727983707), ("year", -2.908720896564361),
("integer (0..10)minute (grain)", -2.908720896564361),
("hour", -2.3978952727983707),
("integer (0..10)week (grain)", -2.908720896564361),
("month", -2.908720896564361), ("minute", -2.908720896564361)],
n = 20},
koData =
ClassData{prior = -infinity, unseen = -2.833213344056216,
ClassData{prior = -infinity, unseen = -2.772588722239781,
likelihoods = HashMap.fromList [], n = 0}}),
("\24527\24724\33410",
Classifier{okData =
@ -1281,11 +1354,11 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("number suffix: \21313|\25342",
Classifier{okData =
ClassData{prior = -0.2231435513142097,
unseen = -3.0910424533583156,
likelihoods = HashMap.fromList [("", 0.0)], n = 20},
ClassData{prior = -0.18924199963852842,
unseen = -3.258096538021482,
likelihoods = HashMap.fromList [("", 0.0)], n = 24},
koData =
ClassData{prior = -1.6094379124341003,
ClassData{prior = -1.7578579175523736,
unseen = -1.9459101490553135,
likelihoods = HashMap.fromList [("", 0.0)], n = 5}}),
("\22320\29699\19968\23567\26102",
@ -1322,11 +1395,19 @@ classifiers
likelihoods = HashMap.fromList [("", 0.0)], n = 6}}),
("<number>\20010/\20491",
Classifier{okData =
ClassData{prior = 0.0, unseen = -3.4339872044851463,
likelihoods = HashMap.fromList [("integer (0..10)", 0.0)], n = 29},
ClassData{prior = -0.2006706954621511,
unseen = -3.4011973816621555,
likelihoods =
HashMap.fromList [("integer (0..10)", -3.509131981127006e-2)],
n = 27},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
ClassData{prior = -1.7047480922384253,
unseen = -2.1972245773362196,
likelihoods =
HashMap.fromList
[("one point 2", -0.9808292530117262),
("integer (0..10)", -0.4700036292457356)],
n = 6}}),
("\24773\20154\33410",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.9459101490553135,

View File

@ -35,6 +35,20 @@ classifiers
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
("number of 5 minutes after|past <integer> (hour-of-day)",
Classifier{okData =
ClassData{prior = 0.0, unseen = -3.332204510175204,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)integer (0..10)",
-0.8979415932059586),
("hour", -0.7308875085427924),
("<integer> (latent time-of-day)<number>\20010/\20491",
-2.1972245773362196)],
n = 12},
koData =
ClassData{prior = -infinity, unseen = -1.3862943611198906,
likelihoods = HashMap.fromList [], n = 0}}),
("\21360\24230\20016\25910\33410\31532\22235\22825",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.6094379124341003,
@ -64,11 +78,11 @@ classifiers
likelihoods = HashMap.fromList [("", 0.0)], n = 3}}),
("integer (numeric)",
Classifier{okData =
ClassData{prior = -0.535142931416697, unseen = -4.204692619390966,
ClassData{prior = -0.621403275701104, unseen = -4.204692619390966,
likelihoods = HashMap.fromList [("", 0.0)], n = 65},
koData =
ClassData{prior = -0.8808888048232392, unseen = -3.871201010907891,
likelihoods = HashMap.fromList [("", 0.0)], n = 46}}),
ClassData{prior = -0.7704388548615918, unseen = -4.060443010546419,
likelihoods = HashMap.fromList [("", 0.0)], n = 56}}),
("\21355\22622\33410",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.9459101490553135,
@ -145,29 +159,29 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("month (grain)",
Classifier{okData =
ClassData{prior = -1.0541605260972757,
ClassData{prior = -1.0840134892469568,
unseen = -3.2188758248682006,
likelihoods = HashMap.fromList [("", 0.0)], n = 23},
koData =
ClassData{prior = -0.42845462633286313,
unseen = -3.8066624897703196,
likelihoods = HashMap.fromList [("", 0.0)], n = 43}}),
ClassData{prior = -0.41284521540578695,
unseen = -3.8501476017100584,
likelihoods = HashMap.fromList [("", 0.0)], n = 45}}),
("<time-of-day> o'clock",
Classifier{okData =
ClassData{prior = -0.4418327522790392, unseen = -3.044522437723423,
ClassData{prior = -1.2367626271489267, unseen = -3.044522437723423,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)", -0.6931471805599453),
("hour", -0.6931471805599453)],
n = 9},
koData =
ClassData{prior = -1.0296194171811581,
unseen = -2.5649493574615367,
ClassData{prior = -0.3429447511268303,
unseen = -3.8501476017100584,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)", -0.6931471805599453),
("hour", -0.6931471805599453)],
n = 5}}),
n = 22}}),
("national day",
Classifier{okData =
ClassData{prior = -0.2231435513142097,
@ -225,71 +239,73 @@ classifiers
likelihoods = HashMap.fromList [("", 0.0)], n = 2}}),
("intersect",
Classifier{okData =
ClassData{prior = -0.39204208777602373,
unseen = -5.198497031265826,
ClassData{prior = -0.3968813644167729, unseen = -5.247024072160486,
likelihoods =
HashMap.fromList
[("\20799\31461\33410<part-of-day> <dim time>",
-3.58351893845611),
-3.632309102625542),
("year (numeric with year symbol)\20809\26126\33410",
-3.1135153092103742),
-3.1623054733798064),
("xxxx year<named-month> <day-of-month>", -3.855452653939752),
("year (numeric with year symbol)\25995\26376",
-3.8066624897703196),
-3.855452653939752),
("year (numeric with year symbol)\20061\22812\33410",
-3.8066624897703196),
-3.855452653939752),
("year (numeric with year symbol)<named-month> <day-of-month>",
-2.3597435068339943),
-2.4085336710034264),
("year (numeric with year symbol)\22320\29699\19968\23567\26102",
-4.0943445622221),
("dayday", -2.4849066497880004),
("hourhour", -3.58351893845611),
("hourminute", -3.58351893845611),
-4.143134726391533),
("dayday", -2.5336968139574325),
("hourhour", -3.632309102625542),
("hourminute", -3.632309102625542),
("absorption of , after named day<named-month> <day-of-month>",
-2.4849066497880004),
-2.5336968139574325),
("year (numeric with year symbol)\22823\25995\26399",
-3.8066624897703196),
-3.855452653939752),
("year (numeric with year symbol)\22235\26092\33410",
-4.0943445622221),
-4.143134726391533),
("year (numeric with year symbol)\20303\26842\33410",
-4.0943445622221),
("dayminute", -3.58351893845611),
("tonight<time-of-day> o'clock", -3.58351893845611),
("<dim time> <part-of-day>relative minutes after|past <integer> (hour-of-day)",
-3.58351893845611),
("yearday", -1.3217558399823195),
-4.143134726391533),
("dayminute", -3.632309102625542),
("tonight<time-of-day> o'clock", -3.632309102625542),
("yearday", -1.3099213823353166),
("year (numeric with year symbol)\19971\19971\33410",
-3.1135153092103742),
-3.1623054733798064),
("year (numeric with year symbol)\36926\36234\33410",
-4.0943445622221),
-4.143134726391533),
("year (numeric with year symbol)\29369\22826\26032\24180",
-4.0943445622221),
("yearminute", -4.0943445622221)],
n = 75},
-4.143134726391533),
("yearminute", -4.143134726391533),
("<dim time> <part-of-day>relative (10-59) minutes after|past <integer> (hour-of-day)",
-3.632309102625542)],
n = 78},
koData =
ClassData{prior = -1.126011262856224, unseen = -4.634728988229636,
ClassData{prior = -1.1160040313799788, unseen = -4.700480365792417,
likelihoods =
HashMap.fromList
[("\20799\31461\33410<part-of-day> <dim time>",
-2.4277482359480516),
("dayhour", -3.0155349008501706),
("daymonth", -2.5455312716044354),
-2.4941233048929243),
("dayhour", -3.0819099697950434),
("daymonth", -2.6119063405493077),
("year (numeric with year symbol)February",
-3.0155349008501706),
("year (numeric with year symbol)Sunday", -3.9318256327243257),
-3.0819099697950434),
("year (numeric with year symbol)Sunday", -3.9982007016691985),
("<dim time> <part-of-day><time-of-day> o'clock",
-3.5263605246161616),
("year (numeric with year symbol)April", -3.5263605246161616),
("hourhour", -3.5263605246161616),
("year (numeric with year symbol)March", -2.4277482359480516),
("hourminute", -3.0155349008501706),
("yearmonth", -1.916922612182061),
("dayminute", -3.0155349008501706),
("<dim time> <part-of-day>relative minutes after|past <integer> (hour-of-day)",
-3.0155349008501706),
("yearday", -3.9318256327243257),
-3.592735593561034),
("year (numeric with year symbol)April", -3.592735593561034),
("hourhour", -3.592735593561034),
("xxxx yearFebruary", -3.9982007016691985),
("year (numeric with year symbol)March", -2.4941233048929243),
("hourminute", -3.0819099697950434),
("yearmonth", -1.8581345381729275),
("dayminute", -3.0819099697950434),
("xxxx yearMarch", -3.9982007016691985),
("yearday", -3.9982007016691985),
("absorption of , after named dayFebruary",
-2.5455312716044354)],
n = 36}}),
-2.6119063405493077),
("<dim time> <part-of-day>relative (10-59) minutes after|past <integer> (hour-of-day)",
-3.0819099697950434)],
n = 38}}),
("\20399\20029\33410",
Classifier{okData =
ClassData{prior = 0.0, unseen = -2.3978952727983707,
@ -299,12 +315,13 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("year (grain)",
Classifier{okData =
ClassData{prior = -1.6625477377480489,
ClassData{prior = -1.6964492894237302,
unseen = -2.5649493574615367,
likelihoods = HashMap.fromList [("", 0.0)], n = 11},
koData =
ClassData{prior = -0.2102954088363608, unseen = -3.891820298110627,
likelihoods = HashMap.fromList [("", 0.0)], n = 47}}),
ClassData{prior = -0.2025242641114741,
unseen = -3.9318256327243257,
likelihoods = HashMap.fromList [("", 0.0)], n = 49}}),
("Saturday",
Classifier{okData =
ClassData{prior = -0.8754687373538999,
@ -460,26 +477,39 @@ classifiers
likelihoods = HashMap.fromList [("", 0.0)], n = 3}}),
("hh:mm (time-of-day)",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.9459101490553135,
likelihoods = HashMap.fromList [("", 0.0)], n = 5},
ClassData{prior = 0.0, unseen = -2.4849066497880004,
likelihoods = HashMap.fromList [("", 0.0)], n = 10},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
("<integer> (latent time-of-day)",
("relative (1-9) minutes after|past <integer> (hour-of-day)",
Classifier{okData =
ClassData{prior = -0.2231435513142097,
unseen = -2.9444389791664407,
ClassData{prior = 0.0, unseen = -3.044522437723423,
likelihoods =
HashMap.fromList
[("integer (numeric)", -1.2809338454620642),
("integer (0..10)", -0.325422400434628)],
n = 16},
[("<integer> (latent time-of-day)integer (0..10)",
-0.6931471805599453),
("hour", -0.6931471805599453)],
n = 9},
koData =
ClassData{prior = -1.6094379124341003,
unseen = -1.9459101490553135,
ClassData{prior = -infinity, unseen = -1.0986122886681098,
likelihoods = HashMap.fromList [], n = 0}}),
("<integer> (latent time-of-day)",
Classifier{okData =
ClassData{prior = -0.3101549283038396,
unseen = -3.6109179126442243,
likelihoods =
HashMap.fromList [("integer (numeric)", -0.1823215567939546)],
n = 4}}),
HashMap.fromList
[("integer (numeric)", -1.9740810260220096),
("integer (0..10)", -0.1823215567939546)],
n = 33},
koData =
ClassData{prior = -1.3217558399823195, unseen = -2.772588722239781,
likelihoods =
HashMap.fromList
[("integer (numeric)", -0.5108256237659907),
("one point 2", -1.0986122886681098)],
n = 12}}),
("\36926\36234\33410",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.3862943611198906,
@ -543,6 +573,26 @@ classifiers
ClassData{prior = -0.5625269981428811,
unseen = -3.9318256327243257,
likelihoods = HashMap.fromList [("", 0.0)], n = 49}}),
("relative (10-59) minutes after|past <integer> (hour-of-day)",
Classifier{okData =
ClassData{prior = -0.5465437063680699, unseen = -3.891820298110627,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)integer with consecutive unit modifiers",
-0.7357067949787413),
("hour", -0.7357067949787413)],
n = 22},
koData =
ClassData{prior = -0.8649974374866046,
unseen = -3.6109179126442243,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)number suffix: \21313|\25342",
-1.3862943611198906),
("<integer> (latent time-of-day)integer (0..10)",
-1.3862943611198906),
("hour", -0.750305594399894)],
n = 16}}),
("year (numeric with year symbol)",
Classifier{okData =
ClassData{prior = 0.0, unseen = -3.891820298110627,
@ -673,8 +723,8 @@ classifiers
likelihoods = HashMap.fromList [("", 0.0)], n = 1}}),
("afternoon",
Classifier{okData =
ClassData{prior = 0.0, unseen = -2.3978952727983707,
likelihoods = HashMap.fromList [("", 0.0)], n = 9},
ClassData{prior = 0.0, unseen = -3.367295829986474,
likelihoods = HashMap.fromList [("", 0.0)], n = 27},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
@ -701,8 +751,8 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("February",
Classifier{okData =
ClassData{prior = 0.0, unseen = -3.2188758248682006,
likelihoods = HashMap.fromList [("", 0.0)], n = 23},
ClassData{prior = 0.0, unseen = -3.258096538021482,
likelihoods = HashMap.fromList [("", 0.0)], n = 24},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
@ -727,8 +777,20 @@ classifiers
n = 23}}),
("minute (grain)",
Classifier{okData =
ClassData{prior = 0.0, unseen = -2.890371757896165,
ClassData{prior = -0.3184537311185346, unseen = -2.890371757896165,
likelihoods = HashMap.fromList [("", 0.0)], n = 16},
koData =
ClassData{prior = -1.2992829841302609,
unseen = -2.0794415416798357,
likelihoods = HashMap.fromList [("", 0.0)], n = 6}}),
("xxxx year",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.3862943611198906,
likelihoods =
HashMap.fromList
[("integer (0..10)integer (0..10)integer (0..10)integer (0..10)",
0.0)],
n = 2},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
@ -749,62 +811,66 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("<part-of-day> <dim time>",
Classifier{okData =
ClassData{prior = -0.6097655716208943, unseen = -4.07753744390572,
ClassData{prior = -0.7507762933965817, unseen = -4.859812404361672,
likelihoods =
HashMap.fromList
[("tonight<integer> (latent time-of-day)", -2.451005098112319),
("hourhour", -1.3523928094442093),
("afternoonrelative minutes after|past <integer> (hour-of-day)",
-1.6625477377480489),
("afternoon<time-of-day> o'clock", -2.6741486494265287),
("hourminute", -1.575536360758419),
[("tonight<integer> (latent time-of-day)", -3.242592351485517),
("afternoonrelative (10-59) minutes after|past <integer> (hour-of-day)",
-1.7165360479904674),
("hourhour", -2.1439800628174073),
("afternoon<time-of-day> o'clock", -3.4657359027997265),
("hourminute", -1.0233888674305223),
("afternoon<integer> (latent time-of-day)",
-2.6741486494265287),
("afternoonhh:mm (time-of-day)", -3.367295829986474),
("tonight<time-of-day> o'clock", -2.451005098112319)],
n = 25},
-3.4657359027997265),
("afternoonrelative (1-9) minutes after|past <integer> (hour-of-day)",
-2.5494451709255714),
("afternoonhh:mm (time-of-day)", -3.7534179752515073),
("tonight<time-of-day> o'clock", -3.242592351485517),
("afternoonnumber of 5 minutes after|past <integer> (hour-of-day)",
-2.2870809064580806)],
n = 59},
koData =
ClassData{prior = -0.7841189587656721,
unseen = -3.9318256327243257,
ClassData{prior = -0.6386589952758756, unseen = -4.962844630259907,
likelihoods =
HashMap.fromList
[("hourhour", -1.4271163556401458),
("afternoonrelative minutes after|past <integer> (hour-of-day)",
-1.5141277326297755),
("afternoon<time-of-day> o'clock", -2.120263536200091),
("hourminute", -1.5141277326297755),
[("afternoonrelative (10-59) minutes after|past <integer> (hour-of-day)",
-2.1226137135450447),
("hourhour", -1.024001424876935),
("afternoon<time-of-day> o'clock", -1.820332841672111),
("hourminute", -2.1226137135450447),
("afternoon<integer> (latent time-of-day)",
-1.9661128563728327)],
n = 21}}),
-1.5885312276147867)],
n = 66}}),
("<integer> <unit-of-duration>",
Classifier{okData =
ClassData{prior = -infinity, unseen = -3.044522437723423,
likelihoods = HashMap.fromList [], n = 0},
koData =
ClassData{prior = 0.0, unseen = -6.12029741895095,
ClassData{prior = 0.0, unseen = -6.18826412308259,
likelihoods =
HashMap.fromList
[("number suffix: \21313|\25342month (grain)",
-4.508659285607248),
("week", -2.8992213731731473),
("integer (0..10)month (grain)", -2.7168998163791924),
("integer (0..10)hour (grain)", -3.1736582188749076),
("<number>\20010/\20491week (grain)", -3.720201925242977),
("second", -3.4790398684260895),
("integer (0..10)day (grain)", -2.982602982112198),
("integer (0..10)year (grain)", -3.8155121050473024),
("<number>\20010/\20491month (grain)", -3.3455084758015667),
("integer (numeric)year (grain)", -2.246896187133457),
("integer (0..10)second (grain)", -3.4790398684260895),
("day", -2.982602982112198), ("year", -2.0750459302067976),
("integer (0..10)minute (grain)", -3.2848838539851317),
("hour", -2.982602982112198),
("integer (0..10)week (grain)", -3.410046996939138),
("month", -1.9437099281457109),
("<number>\20010/\20491hour (grain)", -4.508659285607248),
("integer (numeric)month (grain)", -3.2848838539851317),
("minute", -3.2848838539851317)],
n = 217}}),
-4.576770711466393),
("week", -2.967332799032293),
("integer (0..10)month (grain)", -2.720472721100767),
("integer (0..10)hour (grain)", -3.050714407971344),
("<number>\20010/\20491week (grain)", -3.788313351102123),
("second", -3.5471512942852352),
("integer (0..10)day (grain)", -3.050714407971344),
("integer (0..10)year (grain)", -3.7013019741124937),
("<number>\20010/\20491month (grain)", -3.4136199016607125),
("integer (numeric)year (grain)", -2.315007612992603),
("integer (0..10)second (grain)", -3.5471512942852352),
("day", -3.050714407971344), ("year", -2.1086711799947744),
("integer (0..10)minute (grain)", -3.050714407971344),
("hour", -3.050714407971344),
("integer (0..10)week (grain)", -3.4781584227982836),
("month", -1.9815160045095277),
("integer (numeric)month (grain)", -3.3529952798442775),
("integer with consecutive unit modifiersminute (grain)",
-4.24029847484518),
("minute", -2.81891279391402)],
n = 233}}),
("\32769\26495\33410",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.3862943611198906,
@ -821,56 +887,35 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("<time-of-day> am|pm",
Classifier{okData =
ClassData{prior = -0.4700036292457356, unseen = -2.70805020110221,
ClassData{prior = -0.5596157879354228, unseen = -3.044522437723423,
likelihoods =
HashMap.fromList
[("hh:mm (time-of-day)", -1.252762968495368),
("<integer> (latent time-of-day)", -1.540445040947149),
("hour", -1.540445040947149), ("minute", -1.252762968495368)],
n = 5},
[("hh:mm (time-of-day)", -1.0498221244986778),
("<integer> (latent time-of-day)", -1.8971199848858813),
("hour", -1.8971199848858813), ("minute", -1.0498221244986778)],
n = 8},
koData =
ClassData{prior = -0.9808292530117262,
unseen = -2.3978952727983707,
ClassData{prior = -0.8472978603872037, unseen = -2.833213344056216,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)", -0.916290731874155),
("hour", -0.916290731874155)],
n = 3}}),
("relative minutes after|past <integer> (hour-of-day)",
Classifier{okData =
ClassData{prior = -0.6931471805599453,
unseen = -3.2188758248682006,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)integer with consecutive unit modifiers",
-0.7801585575495751),
("hour", -0.7801585575495751)],
n = 10},
koData =
ClassData{prior = -0.6931471805599453,
unseen = -3.2188758248682006,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)number suffix: \21313|\25342",
-1.3862943611198906),
("<integer> (latent time-of-day)integer (0..10)",
-1.3862943611198906),
("hour", -0.7801585575495751)],
n = 10}}),
[("<integer> (latent time-of-day)", -0.8266785731844679),
("hour", -0.8266785731844679)],
n = 6}}),
("one point 2",
Classifier{okData =
ClassData{prior = -infinity, unseen = -1.3862943611198906,
ClassData{prior = -infinity, unseen = -1.6094379124341003,
likelihoods = HashMap.fromList [], n = 0},
koData =
ClassData{prior = 0.0, unseen = -2.772588722239781,
ClassData{prior = 0.0, unseen = -3.5553480614894135,
likelihoods =
HashMap.fromList
[("integer (0..10)integer (0..10)", -1.3217558399823195),
[("integer (0..10)integer (0..10)", -0.8873031950009028),
("integer (0..10)number suffix: \21313|\25342",
-1.3217558399823195),
-1.7346010553881064),
("integer (0..10)integer with consecutive unit modifiers",
-0.7621400520468967)],
n = 12}}),
-1.128465251817791),
("integer (0..10)<number>\20010/\20491", -2.4277482359480516)],
n = 30}}),
("intersect by \",\"",
Classifier{okData =
ClassData{prior = -0.40546510810816444,
@ -904,16 +949,20 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("integer with consecutive unit modifiers",
Classifier{okData =
ClassData{prior = 0.0, unseen = -3.367295829986474,
ClassData{prior = -5.715841383994864e-2,
unseen = -3.6109179126442243,
likelihoods =
HashMap.fromList
[("number suffix: \21313|\25342integer (0..10)",
-0.6931471805599453),
("integer (0..10)integer (0..10)", -0.6931471805599453)],
n = 26},
n = 34},
koData =
ClassData{prior = -infinity, unseen = -1.0986122886681098,
likelihoods = HashMap.fromList [], n = 0}}),
ClassData{prior = -2.890371757896165, unseen = -1.6094379124341003,
likelihoods =
HashMap.fromList
[("integer (0..10)integer (0..10)", -0.2876820724517809)],
n = 2}}),
("second (grain)",
Classifier{okData =
ClassData{prior = 0.0, unseen = -2.70805020110221,
@ -977,8 +1026,8 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("March",
Classifier{okData =
ClassData{prior = 0.0, unseen = -2.772588722239781,
likelihoods = HashMap.fromList [("", 0.0)], n = 14},
ClassData{prior = 0.0, unseen = -2.833213344056216,
likelihoods = HashMap.fromList [("", 0.0)], n = 15},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
@ -991,11 +1040,12 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("the day after tomorrow",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.6094379124341003,
ClassData{prior = -0.5108256237659907,
unseen = -1.6094379124341003,
likelihoods = HashMap.fromList [("", 0.0)], n = 3},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
ClassData{prior = -0.916290731874155, unseen = -1.3862943611198906,
likelihoods = HashMap.fromList [("", 0.0)], n = 2}}),
("\22307\21608\20845",
Classifier{okData =
ClassData{prior = -0.6931471805599453,
@ -1076,27 +1126,25 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("next n <cycle>",
Classifier{okData =
ClassData{prior = 0.0, unseen = -4.61512051684126,
ClassData{prior = 0.0, unseen = -4.605170185988091,
likelihoods =
HashMap.fromList
[("week", -2.4079456086518722),
("integer (0..10)hour (grain)", -2.659260036932778),
("<number>\20010/\20491week (grain)", -2.995732273553991),
("second", -2.8134107167600364),
("integer (0..10)day (grain)", -2.5257286443082556),
("integer (0..10)year (grain)", -3.2188758248682006),
("<number>\20010/\20491month (grain)", -2.8134107167600364),
("integer (0..10)second (grain)", -2.8134107167600364),
("day", -2.5257286443082556), ("year", -3.2188758248682006),
("integer (0..10)minute (grain)", -2.659260036932778),
("hour", -2.4079456086518722),
("integer (0..10)week (grain)", -2.995732273553991),
("month", -2.8134107167600364),
("<number>\20010/\20491hour (grain)", -3.506557897319982),
("minute", -2.659260036932778)],
[("week", -2.3978952727983707),
("integer (0..10)hour (grain)", -2.3978952727983707),
("<number>\20010/\20491week (grain)", -2.9856819377004897),
("second", -2.803360380906535),
("integer (0..10)day (grain)", -2.515678308454754),
("integer (0..10)year (grain)", -3.2088254890146994),
("<number>\20010/\20491month (grain)", -2.803360380906535),
("integer (0..10)second (grain)", -2.803360380906535),
("day", -2.515678308454754), ("year", -3.2088254890146994),
("integer (0..10)minute (grain)", -2.649209701079277),
("hour", -2.3978952727983707),
("integer (0..10)week (grain)", -2.9856819377004897),
("month", -2.803360380906535), ("minute", -2.649209701079277)],
n = 42},
koData =
ClassData{prior = -infinity, unseen = -2.833213344056216,
ClassData{prior = -infinity, unseen = -2.772588722239781,
likelihoods = HashMap.fromList [], n = 0}}),
("\19975\22307\33410",
Classifier{okData =
@ -1112,6 +1160,14 @@ classifiers
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
("number of five minutes",
Classifier{okData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0},
koData =
ClassData{prior = 0.0, unseen = -1.3862943611198906,
likelihoods = HashMap.fromList [("integer (0..10)", 0.0)],
n = 2}}),
("\20799\31461\33410",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.9459101490553135,
@ -1134,6 +1190,18 @@ classifiers
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
("number.number minutes",
Classifier{okData =
ClassData{prior = -infinity, unseen = -1.0986122886681098,
likelihoods = HashMap.fromList [], n = 0},
koData =
ClassData{prior = 0.0, unseen = -2.3978952727983707,
likelihoods =
HashMap.fromList
[("integer (0..10)integer with consecutive unit modifiersminute (grain)",
-0.6931471805599453),
("minute", -0.6931471805599453)],
n = 4}}),
("\32822\31267\21463\38590\26085",
Classifier{okData =
ClassData{prior = -1.0296194171811581,
@ -1145,19 +1213,19 @@ classifiers
likelihoods = HashMap.fromList [("", 0.0)], n = 9}}),
("<named-month> <day-of-month>",
Classifier{okData =
ClassData{prior = 0.0, unseen = -4.709530201312334,
ClassData{prior = 0.0, unseen = -4.762173934797756,
likelihoods =
HashMap.fromList
[("Marchinteger (0..10)", -2.6210388241125804),
("Marchinteger (numeric)", -3.0910424533583156),
("Aprilinteger (numeric)", -3.6018680771243066),
("Februaryinteger (0..10)", -2.6210388241125804),
("Februarynumber suffix: \21313|\25342", -2.6210388241125804),
("month", -0.7492366472109889),
("Februaryinteger (numeric)", -2.503255788456197),
[("Marchinteger (0..10)", -2.5563656137701454),
("Marchinteger (numeric)", -3.144152278672264),
("Aprilinteger (numeric)", -3.654977902438255),
("Februaryinteger (0..10)", -2.6741486494265287),
("Februarynumber suffix: \21313|\25342", -2.6741486494265287),
("month", -0.7462570058738938),
("Februaryinteger (numeric)", -2.5563656137701454),
("Februaryinteger with consecutive unit modifiers",
-1.8672670217362002)],
n = 51},
-1.8091512119399242)],
n = 54},
koData =
ClassData{prior = -infinity, unseen = -2.1972245773362196,
likelihoods = HashMap.fromList [], n = 0}}),
@ -1191,14 +1259,21 @@ classifiers
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
("two days after tomorrow",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.3862943611198906,
likelihoods = HashMap.fromList [("", 0.0)], n = 2},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
("integer (0..10)",
Classifier{okData =
ClassData{prior = -0.7055697005585025,
unseen = -5.0875963352323845,
likelihoods = HashMap.fromList [("", 0.0)], n = 160},
ClassData{prior = -0.6026331730191135,
unseen = -5.3471075307174685,
likelihoods = HashMap.fromList [("", 0.0)], n = 208},
koData =
ClassData{prior = -0.680877087968131, unseen = -5.111987788356543,
likelihoods = HashMap.fromList [("", 0.0)], n = 164}}),
ClassData{prior = -0.7926767759069784, unseen = -5.159055299214529,
likelihoods = HashMap.fromList [("", 0.0)], n = 172}}),
("last n <cycle>",
Classifier{okData =
ClassData{prior = 0.0, unseen = -4.605170185988091,
@ -1236,27 +1311,25 @@ classifiers
n = 10}}),
("n <cycle> last",
Classifier{okData =
ClassData{prior = 0.0, unseen = -4.04305126783455,
ClassData{prior = 0.0, unseen = -4.02535169073515,
likelihoods =
HashMap.fromList
[("week", -2.4159137783010487),
("integer (0..10)hour (grain)", -2.9267394020670396),
("<number>\20010/\20491week (grain)", -2.9267394020670396),
("second", -2.9267394020670396),
("integer (0..10)day (grain)", -2.4159137783010487),
("integer (0..10)year (grain)", -2.9267394020670396),
("<number>\20010/\20491month (grain)", -2.9267394020670396),
("integer (0..10)second (grain)", -2.9267394020670396),
("day", -2.4159137783010487), ("year", -2.9267394020670396),
("integer (0..10)minute (grain)", -2.9267394020670396),
("hour", -2.4159137783010487),
("integer (0..10)week (grain)", -2.9267394020670396),
("month", -2.9267394020670396),
("<number>\20010/\20491hour (grain)", -2.9267394020670396),
("minute", -2.9267394020670396)],
[("week", -2.3978952727983707),
("integer (0..10)hour (grain)", -2.3978952727983707),
("<number>\20010/\20491week (grain)", -2.908720896564361),
("second", -2.908720896564361),
("integer (0..10)day (grain)", -2.3978952727983707),
("integer (0..10)year (grain)", -2.908720896564361),
("<number>\20010/\20491month (grain)", -2.908720896564361),
("integer (0..10)second (grain)", -2.908720896564361),
("day", -2.3978952727983707), ("year", -2.908720896564361),
("integer (0..10)minute (grain)", -2.908720896564361),
("hour", -2.3978952727983707),
("integer (0..10)week (grain)", -2.908720896564361),
("month", -2.908720896564361), ("minute", -2.908720896564361)],
n = 20},
koData =
ClassData{prior = -infinity, unseen = -2.833213344056216,
ClassData{prior = -infinity, unseen = -2.772588722239781,
likelihoods = HashMap.fromList [], n = 0}}),
("\24527\24724\33410",
Classifier{okData =
@ -1281,11 +1354,11 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("number suffix: \21313|\25342",
Classifier{okData =
ClassData{prior = -0.2231435513142097,
unseen = -3.0910424533583156,
likelihoods = HashMap.fromList [("", 0.0)], n = 20},
ClassData{prior = -0.18924199963852842,
unseen = -3.258096538021482,
likelihoods = HashMap.fromList [("", 0.0)], n = 24},
koData =
ClassData{prior = -1.6094379124341003,
ClassData{prior = -1.7578579175523736,
unseen = -1.9459101490553135,
likelihoods = HashMap.fromList [("", 0.0)], n = 5}}),
("\22320\29699\19968\23567\26102",
@ -1322,11 +1395,19 @@ classifiers
likelihoods = HashMap.fromList [("", 0.0)], n = 6}}),
("<number>\20010/\20491",
Classifier{okData =
ClassData{prior = 0.0, unseen = -3.4339872044851463,
likelihoods = HashMap.fromList [("integer (0..10)", 0.0)], n = 29},
ClassData{prior = -0.2006706954621511,
unseen = -3.4011973816621555,
likelihoods =
HashMap.fromList [("integer (0..10)", -3.509131981127006e-2)],
n = 27},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
ClassData{prior = -1.7047480922384253,
unseen = -2.1972245773362196,
likelihoods =
HashMap.fromList
[("one point 2", -0.9808292530117262),
("integer (0..10)", -0.4700036292457356)],
n = 6}}),
("\24773\20154\33410",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.9459101490553135,

View File

@ -35,6 +35,20 @@ classifiers
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
("number of 5 minutes after|past <integer> (hour-of-day)",
Classifier{okData =
ClassData{prior = 0.0, unseen = -3.332204510175204,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)integer (0..10)",
-0.8979415932059586),
("hour", -0.7308875085427924),
("<integer> (latent time-of-day)<number>\20010/\20491",
-2.1972245773362196)],
n = 12},
koData =
ClassData{prior = -infinity, unseen = -1.3862943611198906,
likelihoods = HashMap.fromList [], n = 0}}),
("\21360\24230\20016\25910\33410\31532\22235\22825",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.6094379124341003,
@ -64,11 +78,11 @@ classifiers
likelihoods = HashMap.fromList [("", 0.0)], n = 3}}),
("integer (numeric)",
Classifier{okData =
ClassData{prior = -0.535142931416697, unseen = -4.204692619390966,
ClassData{prior = -0.621403275701104, unseen = -4.204692619390966,
likelihoods = HashMap.fromList [("", 0.0)], n = 65},
koData =
ClassData{prior = -0.8808888048232392, unseen = -3.871201010907891,
likelihoods = HashMap.fromList [("", 0.0)], n = 46}}),
ClassData{prior = -0.7704388548615918, unseen = -4.060443010546419,
likelihoods = HashMap.fromList [("", 0.0)], n = 56}}),
("\21355\22622\33410",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.9459101490553135,
@ -145,29 +159,29 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("month (grain)",
Classifier{okData =
ClassData{prior = -1.0541605260972757,
ClassData{prior = -1.0840134892469568,
unseen = -3.2188758248682006,
likelihoods = HashMap.fromList [("", 0.0)], n = 23},
koData =
ClassData{prior = -0.42845462633286313,
unseen = -3.8066624897703196,
likelihoods = HashMap.fromList [("", 0.0)], n = 43}}),
ClassData{prior = -0.41284521540578695,
unseen = -3.8501476017100584,
likelihoods = HashMap.fromList [("", 0.0)], n = 45}}),
("<time-of-day> o'clock",
Classifier{okData =
ClassData{prior = -0.4418327522790392, unseen = -3.044522437723423,
ClassData{prior = -1.2367626271489267, unseen = -3.044522437723423,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)", -0.6931471805599453),
("hour", -0.6931471805599453)],
n = 9},
koData =
ClassData{prior = -1.0296194171811581,
unseen = -2.5649493574615367,
ClassData{prior = -0.3429447511268303,
unseen = -3.8501476017100584,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)", -0.6931471805599453),
("hour", -0.6931471805599453)],
n = 5}}),
n = 22}}),
("Wednesday",
Classifier{okData =
ClassData{prior = -5.715841383994864e-2,
@ -216,71 +230,73 @@ classifiers
likelihoods = HashMap.fromList [("", 0.0)], n = 2}}),
("intersect",
Classifier{okData =
ClassData{prior = -0.39204208777602373,
unseen = -5.198497031265826,
ClassData{prior = -0.3968813644167729, unseen = -5.247024072160486,
likelihoods =
HashMap.fromList
[("\20799\31461\33410<part-of-day> <dim time>",
-3.58351893845611),
-3.632309102625542),
("year (numeric with year symbol)\20809\26126\33410",
-3.1135153092103742),
-3.1623054733798064),
("xxxx year<named-month> <day-of-month>", -3.855452653939752),
("year (numeric with year symbol)\25995\26376",
-3.8066624897703196),
-3.855452653939752),
("year (numeric with year symbol)\20061\22812\33410",
-3.8066624897703196),
-3.855452653939752),
("year (numeric with year symbol)<named-month> <day-of-month>",
-2.3597435068339943),
-2.4085336710034264),
("year (numeric with year symbol)\22320\29699\19968\23567\26102",
-4.0943445622221),
("dayday", -2.4849066497880004),
("hourhour", -3.58351893845611),
("hourminute", -3.58351893845611),
-4.143134726391533),
("dayday", -2.5336968139574325),
("hourhour", -3.632309102625542),
("hourminute", -3.632309102625542),
("absorption of , after named day<named-month> <day-of-month>",
-2.4849066497880004),
-2.5336968139574325),
("year (numeric with year symbol)\22823\25995\26399",
-3.8066624897703196),
-3.855452653939752),
("year (numeric with year symbol)\22235\26092\33410",
-4.0943445622221),
-4.143134726391533),
("year (numeric with year symbol)\20303\26842\33410",
-4.0943445622221),
("dayminute", -3.58351893845611),
("tonight<time-of-day> o'clock", -3.58351893845611),
("<dim time> <part-of-day>relative minutes after|past <integer> (hour-of-day)",
-3.58351893845611),
("yearday", -1.3217558399823195),
-4.143134726391533),
("dayminute", -3.632309102625542),
("tonight<time-of-day> o'clock", -3.632309102625542),
("yearday", -1.3099213823353166),
("year (numeric with year symbol)\19971\19971\33410",
-3.1135153092103742),
-3.1623054733798064),
("year (numeric with year symbol)\36926\36234\33410",
-4.0943445622221),
-4.143134726391533),
("year (numeric with year symbol)\29369\22826\26032\24180",
-4.0943445622221),
("yearminute", -4.0943445622221)],
n = 75},
-4.143134726391533),
("yearminute", -4.143134726391533),
("<dim time> <part-of-day>relative (10-59) minutes after|past <integer> (hour-of-day)",
-3.632309102625542)],
n = 78},
koData =
ClassData{prior = -1.126011262856224, unseen = -4.634728988229636,
ClassData{prior = -1.1160040313799788, unseen = -4.700480365792417,
likelihoods =
HashMap.fromList
[("\20799\31461\33410<part-of-day> <dim time>",
-2.4277482359480516),
("dayhour", -3.0155349008501706),
("daymonth", -2.5455312716044354),
-2.4941233048929243),
("dayhour", -3.0819099697950434),
("daymonth", -2.6119063405493077),
("year (numeric with year symbol)February",
-3.0155349008501706),
("year (numeric with year symbol)Sunday", -3.9318256327243257),
-3.0819099697950434),
("year (numeric with year symbol)Sunday", -3.9982007016691985),
("<dim time> <part-of-day><time-of-day> o'clock",
-3.5263605246161616),
("year (numeric with year symbol)April", -3.5263605246161616),
("hourhour", -3.5263605246161616),
("year (numeric with year symbol)March", -2.4277482359480516),
("hourminute", -3.0155349008501706),
("yearmonth", -1.916922612182061),
("dayminute", -3.0155349008501706),
("<dim time> <part-of-day>relative minutes after|past <integer> (hour-of-day)",
-3.0155349008501706),
("yearday", -3.9318256327243257),
-3.592735593561034),
("year (numeric with year symbol)April", -3.592735593561034),
("hourhour", -3.592735593561034),
("xxxx yearFebruary", -3.9982007016691985),
("year (numeric with year symbol)March", -2.4941233048929243),
("hourminute", -3.0819099697950434),
("yearmonth", -1.8581345381729275),
("dayminute", -3.0819099697950434),
("xxxx yearMarch", -3.9982007016691985),
("yearday", -3.9982007016691985),
("absorption of , after named dayFebruary",
-2.5455312716044354)],
n = 36}}),
-2.6119063405493077),
("<dim time> <part-of-day>relative (10-59) minutes after|past <integer> (hour-of-day)",
-3.0819099697950434)],
n = 38}}),
("\20399\20029\33410",
Classifier{okData =
ClassData{prior = 0.0, unseen = -2.3978952727983707,
@ -290,12 +306,13 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("year (grain)",
Classifier{okData =
ClassData{prior = -1.6625477377480489,
ClassData{prior = -1.6964492894237302,
unseen = -2.5649493574615367,
likelihoods = HashMap.fromList [("", 0.0)], n = 11},
koData =
ClassData{prior = -0.2102954088363608, unseen = -3.891820298110627,
likelihoods = HashMap.fromList [("", 0.0)], n = 47}}),
ClassData{prior = -0.2025242641114741,
unseen = -3.9318256327243257,
likelihoods = HashMap.fromList [("", 0.0)], n = 49}}),
("Saturday",
Classifier{okData =
ClassData{prior = -0.8754687373538999,
@ -451,26 +468,39 @@ classifiers
likelihoods = HashMap.fromList [("", 0.0)], n = 3}}),
("hh:mm (time-of-day)",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.9459101490553135,
likelihoods = HashMap.fromList [("", 0.0)], n = 5},
ClassData{prior = 0.0, unseen = -2.4849066497880004,
likelihoods = HashMap.fromList [("", 0.0)], n = 10},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
("<integer> (latent time-of-day)",
("relative (1-9) minutes after|past <integer> (hour-of-day)",
Classifier{okData =
ClassData{prior = -0.2231435513142097,
unseen = -2.9444389791664407,
ClassData{prior = 0.0, unseen = -3.044522437723423,
likelihoods =
HashMap.fromList
[("integer (numeric)", -1.2809338454620642),
("integer (0..10)", -0.325422400434628)],
n = 16},
[("<integer> (latent time-of-day)integer (0..10)",
-0.6931471805599453),
("hour", -0.6931471805599453)],
n = 9},
koData =
ClassData{prior = -1.6094379124341003,
unseen = -1.9459101490553135,
ClassData{prior = -infinity, unseen = -1.0986122886681098,
likelihoods = HashMap.fromList [], n = 0}}),
("<integer> (latent time-of-day)",
Classifier{okData =
ClassData{prior = -0.3101549283038396,
unseen = -3.6109179126442243,
likelihoods =
HashMap.fromList [("integer (numeric)", -0.1823215567939546)],
n = 4}}),
HashMap.fromList
[("integer (numeric)", -1.9740810260220096),
("integer (0..10)", -0.1823215567939546)],
n = 33},
koData =
ClassData{prior = -1.3217558399823195, unseen = -2.772588722239781,
likelihoods =
HashMap.fromList
[("integer (numeric)", -0.5108256237659907),
("one point 2", -1.0986122886681098)],
n = 12}}),
("\36926\36234\33410",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.3862943611198906,
@ -534,6 +564,26 @@ classifiers
ClassData{prior = -0.5625269981428811,
unseen = -3.9318256327243257,
likelihoods = HashMap.fromList [("", 0.0)], n = 49}}),
("relative (10-59) minutes after|past <integer> (hour-of-day)",
Classifier{okData =
ClassData{prior = -0.5465437063680699, unseen = -3.891820298110627,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)integer with consecutive unit modifiers",
-0.7357067949787413),
("hour", -0.7357067949787413)],
n = 22},
koData =
ClassData{prior = -0.8649974374866046,
unseen = -3.6109179126442243,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)number suffix: \21313|\25342",
-1.3862943611198906),
("<integer> (latent time-of-day)integer (0..10)",
-1.3862943611198906),
("hour", -0.750305594399894)],
n = 16}}),
("year (numeric with year symbol)",
Classifier{okData =
ClassData{prior = 0.0, unseen = -3.891820298110627,
@ -664,8 +714,8 @@ classifiers
likelihoods = HashMap.fromList [("", 0.0)], n = 1}}),
("afternoon",
Classifier{okData =
ClassData{prior = 0.0, unseen = -2.3978952727983707,
likelihoods = HashMap.fromList [("", 0.0)], n = 9},
ClassData{prior = 0.0, unseen = -3.367295829986474,
likelihoods = HashMap.fromList [("", 0.0)], n = 27},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
@ -692,8 +742,8 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("February",
Classifier{okData =
ClassData{prior = 0.0, unseen = -3.2188758248682006,
likelihoods = HashMap.fromList [("", 0.0)], n = 23},
ClassData{prior = 0.0, unseen = -3.258096538021482,
likelihoods = HashMap.fromList [("", 0.0)], n = 24},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
@ -718,8 +768,20 @@ classifiers
n = 23}}),
("minute (grain)",
Classifier{okData =
ClassData{prior = 0.0, unseen = -2.890371757896165,
ClassData{prior = -0.3184537311185346, unseen = -2.890371757896165,
likelihoods = HashMap.fromList [("", 0.0)], n = 16},
koData =
ClassData{prior = -1.2992829841302609,
unseen = -2.0794415416798357,
likelihoods = HashMap.fromList [("", 0.0)], n = 6}}),
("xxxx year",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.3862943611198906,
likelihoods =
HashMap.fromList
[("integer (0..10)integer (0..10)integer (0..10)integer (0..10)",
0.0)],
n = 2},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
@ -739,62 +801,66 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("<part-of-day> <dim time>",
Classifier{okData =
ClassData{prior = -0.6097655716208943, unseen = -4.07753744390572,
ClassData{prior = -0.7507762933965817, unseen = -4.859812404361672,
likelihoods =
HashMap.fromList
[("tonight<integer> (latent time-of-day)", -2.451005098112319),
("hourhour", -1.3523928094442093),
("afternoonrelative minutes after|past <integer> (hour-of-day)",
-1.6625477377480489),
("afternoon<time-of-day> o'clock", -2.6741486494265287),
("hourminute", -1.575536360758419),
[("tonight<integer> (latent time-of-day)", -3.242592351485517),
("afternoonrelative (10-59) minutes after|past <integer> (hour-of-day)",
-1.7165360479904674),
("hourhour", -2.1439800628174073),
("afternoon<time-of-day> o'clock", -3.4657359027997265),
("hourminute", -1.0233888674305223),
("afternoon<integer> (latent time-of-day)",
-2.6741486494265287),
("afternoonhh:mm (time-of-day)", -3.367295829986474),
("tonight<time-of-day> o'clock", -2.451005098112319)],
n = 25},
-3.4657359027997265),
("afternoonrelative (1-9) minutes after|past <integer> (hour-of-day)",
-2.5494451709255714),
("afternoonhh:mm (time-of-day)", -3.7534179752515073),
("tonight<time-of-day> o'clock", -3.242592351485517),
("afternoonnumber of 5 minutes after|past <integer> (hour-of-day)",
-2.2870809064580806)],
n = 59},
koData =
ClassData{prior = -0.7841189587656721,
unseen = -3.9318256327243257,
ClassData{prior = -0.6386589952758756, unseen = -4.962844630259907,
likelihoods =
HashMap.fromList
[("hourhour", -1.4271163556401458),
("afternoonrelative minutes after|past <integer> (hour-of-day)",
-1.5141277326297755),
("afternoon<time-of-day> o'clock", -2.120263536200091),
("hourminute", -1.5141277326297755),
[("afternoonrelative (10-59) minutes after|past <integer> (hour-of-day)",
-2.1226137135450447),
("hourhour", -1.024001424876935),
("afternoon<time-of-day> o'clock", -1.820332841672111),
("hourminute", -2.1226137135450447),
("afternoon<integer> (latent time-of-day)",
-1.9661128563728327)],
n = 21}}),
-1.5885312276147867)],
n = 66}}),
("<integer> <unit-of-duration>",
Classifier{okData =
ClassData{prior = -infinity, unseen = -3.044522437723423,
likelihoods = HashMap.fromList [], n = 0},
koData =
ClassData{prior = 0.0, unseen = -6.12029741895095,
ClassData{prior = 0.0, unseen = -6.18826412308259,
likelihoods =
HashMap.fromList
[("number suffix: \21313|\25342month (grain)",
-4.508659285607248),
("week", -2.8992213731731473),
("integer (0..10)month (grain)", -2.7168998163791924),
("integer (0..10)hour (grain)", -3.1736582188749076),
("<number>\20010/\20491week (grain)", -3.720201925242977),
("second", -3.4790398684260895),
("integer (0..10)day (grain)", -2.982602982112198),
("integer (0..10)year (grain)", -3.8155121050473024),
("<number>\20010/\20491month (grain)", -3.3455084758015667),
("integer (numeric)year (grain)", -2.246896187133457),
("integer (0..10)second (grain)", -3.4790398684260895),
("day", -2.982602982112198), ("year", -2.0750459302067976),
("integer (0..10)minute (grain)", -3.2848838539851317),
("hour", -2.982602982112198),
("integer (0..10)week (grain)", -3.410046996939138),
("month", -1.9437099281457109),
("<number>\20010/\20491hour (grain)", -4.508659285607248),
("integer (numeric)month (grain)", -3.2848838539851317),
("minute", -3.2848838539851317)],
n = 217}}),
-4.576770711466393),
("week", -2.967332799032293),
("integer (0..10)month (grain)", -2.720472721100767),
("integer (0..10)hour (grain)", -3.050714407971344),
("<number>\20010/\20491week (grain)", -3.788313351102123),
("second", -3.5471512942852352),
("integer (0..10)day (grain)", -3.050714407971344),
("integer (0..10)year (grain)", -3.7013019741124937),
("<number>\20010/\20491month (grain)", -3.4136199016607125),
("integer (numeric)year (grain)", -2.315007612992603),
("integer (0..10)second (grain)", -3.5471512942852352),
("day", -3.050714407971344), ("year", -2.1086711799947744),
("integer (0..10)minute (grain)", -3.050714407971344),
("hour", -3.050714407971344),
("integer (0..10)week (grain)", -3.4781584227982836),
("month", -1.9815160045095277),
("integer (numeric)month (grain)", -3.3529952798442775),
("integer with consecutive unit modifiersminute (grain)",
-4.24029847484518),
("minute", -2.81891279391402)],
n = 233}}),
("\32769\26495\33410",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.3862943611198906,
@ -811,56 +877,35 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("<time-of-day> am|pm",
Classifier{okData =
ClassData{prior = -0.4700036292457356, unseen = -2.70805020110221,
ClassData{prior = -0.5596157879354228, unseen = -3.044522437723423,
likelihoods =
HashMap.fromList
[("hh:mm (time-of-day)", -1.252762968495368),
("<integer> (latent time-of-day)", -1.540445040947149),
("hour", -1.540445040947149), ("minute", -1.252762968495368)],
n = 5},
[("hh:mm (time-of-day)", -1.0498221244986778),
("<integer> (latent time-of-day)", -1.8971199848858813),
("hour", -1.8971199848858813), ("minute", -1.0498221244986778)],
n = 8},
koData =
ClassData{prior = -0.9808292530117262,
unseen = -2.3978952727983707,
ClassData{prior = -0.8472978603872037, unseen = -2.833213344056216,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)", -0.916290731874155),
("hour", -0.916290731874155)],
n = 3}}),
("relative minutes after|past <integer> (hour-of-day)",
Classifier{okData =
ClassData{prior = -0.6931471805599453,
unseen = -3.2188758248682006,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)integer with consecutive unit modifiers",
-0.7801585575495751),
("hour", -0.7801585575495751)],
n = 10},
koData =
ClassData{prior = -0.6931471805599453,
unseen = -3.2188758248682006,
likelihoods =
HashMap.fromList
[("<integer> (latent time-of-day)number suffix: \21313|\25342",
-1.3862943611198906),
("<integer> (latent time-of-day)integer (0..10)",
-1.3862943611198906),
("hour", -0.7801585575495751)],
n = 10}}),
[("<integer> (latent time-of-day)", -0.8266785731844679),
("hour", -0.8266785731844679)],
n = 6}}),
("one point 2",
Classifier{okData =
ClassData{prior = -infinity, unseen = -1.3862943611198906,
ClassData{prior = -infinity, unseen = -1.6094379124341003,
likelihoods = HashMap.fromList [], n = 0},
koData =
ClassData{prior = 0.0, unseen = -2.772588722239781,
ClassData{prior = 0.0, unseen = -3.5553480614894135,
likelihoods =
HashMap.fromList
[("integer (0..10)integer (0..10)", -1.3217558399823195),
[("integer (0..10)integer (0..10)", -0.8873031950009028),
("integer (0..10)number suffix: \21313|\25342",
-1.3217558399823195),
-1.7346010553881064),
("integer (0..10)integer with consecutive unit modifiers",
-0.7621400520468967)],
n = 12}}),
-1.128465251817791),
("integer (0..10)<number>\20010/\20491", -2.4277482359480516)],
n = 30}}),
("intersect by \",\"",
Classifier{okData =
ClassData{prior = -0.40546510810816444,
@ -894,16 +939,20 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("integer with consecutive unit modifiers",
Classifier{okData =
ClassData{prior = 0.0, unseen = -3.367295829986474,
ClassData{prior = -5.715841383994864e-2,
unseen = -3.6109179126442243,
likelihoods =
HashMap.fromList
[("number suffix: \21313|\25342integer (0..10)",
-0.6931471805599453),
("integer (0..10)integer (0..10)", -0.6931471805599453)],
n = 26},
n = 34},
koData =
ClassData{prior = -infinity, unseen = -1.0986122886681098,
likelihoods = HashMap.fromList [], n = 0}}),
ClassData{prior = -2.890371757896165, unseen = -1.6094379124341003,
likelihoods =
HashMap.fromList
[("integer (0..10)integer (0..10)", -0.2876820724517809)],
n = 2}}),
("second (grain)",
Classifier{okData =
ClassData{prior = 0.0, unseen = -2.70805020110221,
@ -967,8 +1016,8 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("March",
Classifier{okData =
ClassData{prior = 0.0, unseen = -2.772588722239781,
likelihoods = HashMap.fromList [("", 0.0)], n = 14},
ClassData{prior = 0.0, unseen = -2.833213344056216,
likelihoods = HashMap.fromList [("", 0.0)], n = 15},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
@ -981,11 +1030,12 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("the day after tomorrow",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.6094379124341003,
ClassData{prior = -0.5108256237659907,
unseen = -1.6094379124341003,
likelihoods = HashMap.fromList [("", 0.0)], n = 3},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
ClassData{prior = -0.916290731874155, unseen = -1.3862943611198906,
likelihoods = HashMap.fromList [("", 0.0)], n = 2}}),
("\22307\21608\20845",
Classifier{okData =
ClassData{prior = -0.6931471805599453,
@ -1066,27 +1116,25 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("next n <cycle>",
Classifier{okData =
ClassData{prior = 0.0, unseen = -4.61512051684126,
ClassData{prior = 0.0, unseen = -4.605170185988091,
likelihoods =
HashMap.fromList
[("week", -2.4079456086518722),
("integer (0..10)hour (grain)", -2.659260036932778),
("<number>\20010/\20491week (grain)", -2.995732273553991),
("second", -2.8134107167600364),
("integer (0..10)day (grain)", -2.5257286443082556),
("integer (0..10)year (grain)", -3.2188758248682006),
("<number>\20010/\20491month (grain)", -2.8134107167600364),
("integer (0..10)second (grain)", -2.8134107167600364),
("day", -2.5257286443082556), ("year", -3.2188758248682006),
("integer (0..10)minute (grain)", -2.659260036932778),
("hour", -2.4079456086518722),
("integer (0..10)week (grain)", -2.995732273553991),
("month", -2.8134107167600364),
("<number>\20010/\20491hour (grain)", -3.506557897319982),
("minute", -2.659260036932778)],
[("week", -2.3978952727983707),
("integer (0..10)hour (grain)", -2.3978952727983707),
("<number>\20010/\20491week (grain)", -2.9856819377004897),
("second", -2.803360380906535),
("integer (0..10)day (grain)", -2.515678308454754),
("integer (0..10)year (grain)", -3.2088254890146994),
("<number>\20010/\20491month (grain)", -2.803360380906535),
("integer (0..10)second (grain)", -2.803360380906535),
("day", -2.515678308454754), ("year", -3.2088254890146994),
("integer (0..10)minute (grain)", -2.649209701079277),
("hour", -2.3978952727983707),
("integer (0..10)week (grain)", -2.9856819377004897),
("month", -2.803360380906535), ("minute", -2.649209701079277)],
n = 42},
koData =
ClassData{prior = -infinity, unseen = -2.833213344056216,
ClassData{prior = -infinity, unseen = -2.772588722239781,
likelihoods = HashMap.fromList [], n = 0}}),
("\19975\22307\33410",
Classifier{okData =
@ -1102,6 +1150,14 @@ classifiers
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
("number of five minutes",
Classifier{okData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0},
koData =
ClassData{prior = 0.0, unseen = -1.3862943611198906,
likelihoods = HashMap.fromList [("integer (0..10)", 0.0)],
n = 2}}),
("\20799\31461\33410",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.9459101490553135,
@ -1124,6 +1180,18 @@ classifiers
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
("number.number minutes",
Classifier{okData =
ClassData{prior = -infinity, unseen = -1.0986122886681098,
likelihoods = HashMap.fromList [], n = 0},
koData =
ClassData{prior = 0.0, unseen = -2.3978952727983707,
likelihoods =
HashMap.fromList
[("integer (0..10)integer with consecutive unit modifiersminute (grain)",
-0.6931471805599453),
("minute", -0.6931471805599453)],
n = 4}}),
("\32822\31267\21463\38590\26085",
Classifier{okData =
ClassData{prior = -1.0296194171811581,
@ -1135,19 +1203,19 @@ classifiers
likelihoods = HashMap.fromList [("", 0.0)], n = 9}}),
("<named-month> <day-of-month>",
Classifier{okData =
ClassData{prior = 0.0, unseen = -4.709530201312334,
ClassData{prior = 0.0, unseen = -4.762173934797756,
likelihoods =
HashMap.fromList
[("Marchinteger (0..10)", -2.6210388241125804),
("Marchinteger (numeric)", -3.0910424533583156),
("Aprilinteger (numeric)", -3.6018680771243066),
("Februaryinteger (0..10)", -2.6210388241125804),
("Februarynumber suffix: \21313|\25342", -2.6210388241125804),
("month", -0.7492366472109889),
("Februaryinteger (numeric)", -2.503255788456197),
[("Marchinteger (0..10)", -2.5563656137701454),
("Marchinteger (numeric)", -3.144152278672264),
("Aprilinteger (numeric)", -3.654977902438255),
("Februaryinteger (0..10)", -2.6741486494265287),
("Februarynumber suffix: \21313|\25342", -2.6741486494265287),
("month", -0.7462570058738938),
("Februaryinteger (numeric)", -2.5563656137701454),
("Februaryinteger with consecutive unit modifiers",
-1.8672670217362002)],
n = 51},
-1.8091512119399242)],
n = 54},
koData =
ClassData{prior = -infinity, unseen = -2.1972245773362196,
likelihoods = HashMap.fromList [], n = 0}}),
@ -1181,14 +1249,21 @@ classifiers
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
("two days after tomorrow",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.3862943611198906,
likelihoods = HashMap.fromList [("", 0.0)], n = 2},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
("integer (0..10)",
Classifier{okData =
ClassData{prior = -0.7055697005585025,
unseen = -5.0875963352323845,
likelihoods = HashMap.fromList [("", 0.0)], n = 160},
ClassData{prior = -0.6026331730191135,
unseen = -5.3471075307174685,
likelihoods = HashMap.fromList [("", 0.0)], n = 208},
koData =
ClassData{prior = -0.680877087968131, unseen = -5.111987788356543,
likelihoods = HashMap.fromList [("", 0.0)], n = 164}}),
ClassData{prior = -0.7926767759069784, unseen = -5.159055299214529,
likelihoods = HashMap.fromList [("", 0.0)], n = 172}}),
("last n <cycle>",
Classifier{okData =
ClassData{prior = 0.0, unseen = -4.605170185988091,
@ -1226,27 +1301,25 @@ classifiers
n = 10}}),
("n <cycle> last",
Classifier{okData =
ClassData{prior = 0.0, unseen = -4.04305126783455,
ClassData{prior = 0.0, unseen = -4.02535169073515,
likelihoods =
HashMap.fromList
[("week", -2.4159137783010487),
("integer (0..10)hour (grain)", -2.9267394020670396),
("<number>\20010/\20491week (grain)", -2.9267394020670396),
("second", -2.9267394020670396),
("integer (0..10)day (grain)", -2.4159137783010487),
("integer (0..10)year (grain)", -2.9267394020670396),
("<number>\20010/\20491month (grain)", -2.9267394020670396),
("integer (0..10)second (grain)", -2.9267394020670396),
("day", -2.4159137783010487), ("year", -2.9267394020670396),
("integer (0..10)minute (grain)", -2.9267394020670396),
("hour", -2.4159137783010487),
("integer (0..10)week (grain)", -2.9267394020670396),
("month", -2.9267394020670396),
("<number>\20010/\20491hour (grain)", -2.9267394020670396),
("minute", -2.9267394020670396)],
[("week", -2.3978952727983707),
("integer (0..10)hour (grain)", -2.3978952727983707),
("<number>\20010/\20491week (grain)", -2.908720896564361),
("second", -2.908720896564361),
("integer (0..10)day (grain)", -2.3978952727983707),
("integer (0..10)year (grain)", -2.908720896564361),
("<number>\20010/\20491month (grain)", -2.908720896564361),
("integer (0..10)second (grain)", -2.908720896564361),
("day", -2.3978952727983707), ("year", -2.908720896564361),
("integer (0..10)minute (grain)", -2.908720896564361),
("hour", -2.3978952727983707),
("integer (0..10)week (grain)", -2.908720896564361),
("month", -2.908720896564361), ("minute", -2.908720896564361)],
n = 20},
koData =
ClassData{prior = -infinity, unseen = -2.833213344056216,
ClassData{prior = -infinity, unseen = -2.772588722239781,
likelihoods = HashMap.fromList [], n = 0}}),
("\24527\24724\33410",
Classifier{okData =
@ -1271,11 +1344,11 @@ classifiers
likelihoods = HashMap.fromList [], n = 0}}),
("number suffix: \21313|\25342",
Classifier{okData =
ClassData{prior = -0.2231435513142097,
unseen = -3.0910424533583156,
likelihoods = HashMap.fromList [("", 0.0)], n = 20},
ClassData{prior = -0.18924199963852842,
unseen = -3.258096538021482,
likelihoods = HashMap.fromList [("", 0.0)], n = 24},
koData =
ClassData{prior = -1.6094379124341003,
ClassData{prior = -1.7578579175523736,
unseen = -1.9459101490553135,
likelihoods = HashMap.fromList [("", 0.0)], n = 5}}),
("\22320\29699\19968\23567\26102",
@ -1312,11 +1385,19 @@ classifiers
likelihoods = HashMap.fromList [("", 0.0)], n = 6}}),
("<number>\20010/\20491",
Classifier{okData =
ClassData{prior = 0.0, unseen = -3.4339872044851463,
likelihoods = HashMap.fromList [("integer (0..10)", 0.0)], n = 29},
ClassData{prior = -0.2006706954621511,
unseen = -3.4011973816621555,
likelihoods =
HashMap.fromList [("integer (0..10)", -3.509131981127006e-2)],
n = 27},
koData =
ClassData{prior = -infinity, unseen = -0.6931471805599453,
likelihoods = HashMap.fromList [], n = 0}}),
ClassData{prior = -1.7047480922384253,
unseen = -2.1972245773362196,
likelihoods =
HashMap.fromList
[("one point 2", -0.9808292530117262),
("integer (0..10)", -0.4700036292457356)],
n = 6}}),
("\24773\20154\33410",
Classifier{okData =
ClassData{prior = 0.0, unseen = -1.9459101490553135,

View File

@ -19,6 +19,7 @@ import Duckling.Locale
import Duckling.Types
import qualified Duckling.AmountOfMoney.ZH.Rules as AmountOfMoney
import qualified Duckling.Distance.ZH.Rules as Distance
import qualified Duckling.Duration.ZH.Rules as Duration
import qualified Duckling.Numeral.ZH.Rules as Numeral
import qualified Duckling.Ordinal.ZH.Rules as Ordinal
import qualified Duckling.Quantity.ZH.Rules as Quantity
@ -45,7 +46,7 @@ langRules :: Seal Dimension -> [Rule]
langRules (Seal AmountOfMoney) = AmountOfMoney.rules
langRules (Seal CreditCardNumber) = []
langRules (Seal Distance) = Distance.rules
langRules (Seal Duration) = []
langRules (Seal Duration) = Duration.rules
langRules (Seal Email) = []
langRules (Seal Numeral) = Numeral.rules
langRules (Seal Ordinal) = Ordinal.rules

View File

@ -60,6 +60,10 @@ allExamples = concat
, "後天"
, "後日"
]
, examples (datetime (2013, 2, 15, 0, 0, 0) Day)
[ "大後日"
, "大後天"
]
, examples (datetime (2013, 2, 10, 0, 0, 0) Day)
[ "前天"
, "前日"
@ -177,6 +181,7 @@ allExamples = concat
, "3/3/15"
, "2015-3-3"
, "2015-03-03"
, "二零一五年三月三號"
]
, examples (datetime (2013, 2, 15, 0, 0, 0) Day)
[ "2013年2月15号"
@ -188,6 +193,7 @@ allExamples = concat
, "2月15號"
, "二月十五號"
, "2/15"
, "二零一三年二月十五號"
]
, examples (datetime (1974, 10, 31, 0, 0, 0) Day)
[ "10/31/1974"
@ -449,6 +455,30 @@ allExamples = concat
, "3:15p"
, "下午三點十五"
, "晏晝三點十五"
, "下午三点十五分"
, "下午三點十五分"
, "晏晝三點十五分"
, "晏晝三點三"
, "晏晝三點踏三"
, "晏晝三點搭三"
, "晏晝三點三個字"
]
, examples (datetime (2013, 2, 12, 15, 05, 0) Minute)
[ "下午三点零五"
, "下午3:05"
, "15:05"
, "3:05pm"
, "3:05PM"
, "3:05p"
, "下午三點零五"
, "晏晝三點零五"
, "下午三点零五分"
, "下午三點零五分"
, "晏晝三點零五分"
, "晏晝三點一"
, "晏晝三點踏一"
, "晏晝三點搭一"
, "晏晝三點一個字"
]
, examples (datetime (2013, 2, 12, 13, 0, 0) Minute)
[ "4pm CET"

View File

@ -19,6 +19,7 @@ import qualified Data.Text as Text
import Duckling.Dimensions.Types
import Duckling.Numeral.Helpers (parseInt)
import Duckling.Numeral.Types (NumeralData(..))
import Duckling.Regex.Types
import Duckling.Time.Computed
import Duckling.Time.Helpers
@ -27,6 +28,7 @@ import Duckling.Types
import qualified Duckling.Ordinal.Types as TOrdinal
import qualified Duckling.Time.Types as TTime
import qualified Duckling.TimeGrain.Types as TG
import qualified Duckling.Numeral.Types as TNumeral
ruleTheDayAfterTomorrow :: Rule
ruleTheDayAfterTomorrow = Rule
@ -37,6 +39,15 @@ ruleTheDayAfterTomorrow = Rule
, prod = \_ -> tt $ cycleNth TG.Day 2
}
-- | Fixed expressions 大后天 / 大後天 / 大後日. The matched text carries no
-- further information, so the production ignores its tokens and always
-- yields @cycleNth TG.Day 3@.
ruleTwoDaysAfterTomorrow :: Rule
ruleTwoDaysAfterTomorrow = Rule
  { name = "two days after tomorrow"
  , pattern = [regex "大后天|大後天|大後日"]
  , prod = const . tt $ cycleNth TG.Day 3
  }
ruleRelativeMinutesTotillbeforeIntegerHourofday :: Rule
ruleRelativeMinutesTotillbeforeIntegerHourofday = Rule
{ name = "relative minutes to|till|before <integer> (hour-of-day)"
@ -69,11 +80,11 @@ ruleRelativeMinutesTotillbeforeNoonmidnight = Rule
ruleRelativeMinutesAfterpastIntegerHourofday :: Rule
ruleRelativeMinutesAfterpastIntegerHourofday = Rule
{ name = "relative minutes after|past <integer> (hour-of-day)"
{ name = "relative (10-59) minutes after|past <integer> (hour-of-day)"
, pattern =
[ Predicate isAnHourOfDay
, regex "点|點"
, Predicate $ isIntegerBetween 1 59
, Predicate $ isIntegerBetween 10 59
]
, prod = \tokens -> case tokens of
(Token Time TimeData {TTime.form = Just (TTime.TimeOfDay (Just hours) _)}:
@ -85,6 +96,117 @@ ruleRelativeMinutesAfterpastIntegerHourofday = Rule
_ -> Nothing
}
-- | Minutes past the hour written with an explicit trailing minute marker:
-- an hour-of-day, 点|點, an integer in 10..59, then 分 (e.g. "三点十五分").
--
-- The production reads the hour from the time token and the minutes from the
-- integer token; the separator and the trailing marker are ignored.
ruleRelativeMinutesAfterpastIntegerHourofday2 :: Rule
ruleRelativeMinutesAfterpastIntegerHourofday2 = Rule
  { name = "relative (10-59) minutes after|past <integer> (hour-of-day)"
  , pattern =
    [ Predicate isAnHourOfDay
    , regex "点|點"
    , Predicate $ isIntegerBetween 10 59
      -- The suffix must be matched literally: an empty pattern gives the
      -- rule nothing to anchor on and makes it a duplicate of the
      -- suffix-less variant.
    , regex "分"
    ]
  , prod = \tokens -> case tokens of
      (Token Time TimeData {TTime.form = Just (TTime.TimeOfDay (Just hours) _)}:
       _:
       token:
       _) -> do
        n <- getIntValue token
        tt $ hourMinute True hours n
      _ -> Nothing
  }
-- | Single-digit minutes past the hour, written with a 零 filler after the
-- hour marker: an hour-of-day, 点零|點零, then an integer in 1..9.
--
-- Produces nothing when the first token carries no hour or the integer token
-- has no integral value.
ruleRelativeMinutesAfterpastIntegerHourofday3 :: Rule
ruleRelativeMinutesAfterpastIntegerHourofday3 = Rule
  { name = "relative (1-9) minutes after|past <integer> (hour-of-day)"
  , pattern =
    [ Predicate isAnHourOfDay
    , regex "点零|點零"
    , Predicate $ isIntegerBetween 1 9
    ]
  , prod = \tokens -> case tokens of
      (Token Time TimeData {TTime.form = Just (TTime.TimeOfDay (Just h) _)}
        : _ : minuteTok : _) ->
        getIntValue minuteTok >>= tt . hourMinute True h
      _ -> Nothing
  }
-- | Single-digit minutes past the hour with an explicit trailing minute
-- marker: an hour-of-day, 点零|點零, an integer in 1..9, then 分
-- (e.g. "三点零五分").
--
-- The production reads the hour from the time token and the minutes from the
-- integer token; the separator and the trailing marker are ignored.
ruleRelativeMinutesAfterpastIntegerHourofday4 :: Rule
ruleRelativeMinutesAfterpastIntegerHourofday4 = Rule
  { name = "relative (1-9) minutes after|past <integer> (hour-of-day)"
  , pattern =
    [ Predicate isAnHourOfDay
    , regex "点零|點零"
    , Predicate $ isIntegerBetween 1 9
      -- The suffix must be matched literally: an empty pattern gives the
      -- rule nothing to anchor on and makes it a duplicate of the
      -- suffix-less variant.
    , regex "分"
    ]
  , prod = \tokens -> case tokens of
      (Token Time TimeData {TTime.form = Just (TTime.TimeOfDay (Just hours) _)}:
       _:
       token:
       _) -> do
        n <- getIntValue token
        tt $ hourMinute True hours n
      _ -> Nothing
  }
-- | Minutes given as a count of five-minute units after 踏/搭: an
-- hour-of-day, 点踏|點踏|点搭|點搭, then an integer in 1..11. The minute value
-- handed to 'hourMinute' is five times that integer.
ruleRelativeMinutesAfterpastIntegerHourofday5 :: Rule
ruleRelativeMinutesAfterpastIntegerHourofday5 = Rule
  { name = "number of 5 minutes after|past <integer> (hour-of-day)"
  , pattern =
    [ Predicate isAnHourOfDay
    , regex "点踏|點踏|点搭|點搭"
    , Predicate $ isIntegerBetween 1 11
    ]
  , prod = \tokens -> case tokens of
      (Token Time TimeData {TTime.form = Just (TTime.TimeOfDay (Just h) _)}
        : _ : unitsTok : _) ->
        tt . hourMinute True h . (5 *) =<< getIntValue unitsTok
      _ -> Nothing
  }
-- | Bare single digit after the hour marker, read as a count of five-minute
-- units: an hour-of-day, 点|點, then an integer in 1..9. The minute value
-- handed to 'hourMinute' is five times that integer (e.g. "三點三" is listed
-- in the corpus under 15:15).
ruleRelativeMinutesAfterpastIntegerHourofday6 :: Rule
ruleRelativeMinutesAfterpastIntegerHourofday6 = Rule
  { name = "number of 5 minutes after|past <integer> (hour-of-day)"
  , pattern =
    [ Predicate isAnHourOfDay
    , regex "点|點"
    , Predicate $ isIntegerBetween 1 9
    ]
  , prod = \tokens -> case tokens of
      (Token Time TimeData {TTime.form = Just (TTime.TimeOfDay (Just h) _)}
        : _ : unitsTok : _) ->
        tt . hourMinute True h . (5 *) =<< getIntValue unitsTok
      _ -> Nothing
  }
-- | Count of five-minute units with the explicit 個字 suffix: an
-- hour-of-day, 点|點, an integer in 1..11, then 個字. The minute value handed
-- to 'hourMinute' is five times that integer; the suffix token is ignored.
ruleRelativeMinutesAfterpastIntegerHourofday7 :: Rule
ruleRelativeMinutesAfterpastIntegerHourofday7 = Rule
  { name = "number of 5 minutes after|past <integer> (hour-of-day)"
  , pattern =
    [ Predicate isAnHourOfDay
    , regex "点|點"
    , Predicate $ isIntegerBetween 1 11
    , regex "個字"
    ]
  , prod = \tokens -> case tokens of
      (Token Time TimeData {TTime.form = Just (TTime.TimeOfDay (Just h) _)}
        : _ : unitsTok : _) ->
        tt . hourMinute True h . (5 *) =<< getIntValue unitsTok
      _ -> Nothing
  }
ruleRelativeMinutesAfterpastNoonmidnight :: Rule
ruleRelativeMinutesAfterpastNoonmidnight = Rule
{ name = "relative minutes after|past noon|midnight"
@ -478,6 +600,27 @@ ruleYearNumericWithYearSymbol = Rule
_ -> Nothing
}
-- | Year spelled out as four consecutive numerals followed by the year
-- marker 年 (e.g. "二零一五年"). The four values are combined positionally as
-- thousands, hundreds, tens and units, and the result is passed to 'year'.
--
-- NOTE(review): the pattern accepts any four Numeral tokens; nothing here
-- restricts each one to a single digit 0..9 — confirm whether that is
-- intended.
ruleYearNumericWithYearSymbol2 :: Rule
ruleYearNumericWithYearSymbol2 = Rule
  { name = "xxxx year"
  , pattern =
    [ dimension Numeral
    , dimension Numeral
    , dimension Numeral
    , dimension Numeral
      -- The year marker must be matched literally: an empty pattern would
      -- let any run of four numerals be read as a year.
    , regex "年"
    ]
  , prod = \tokens -> case tokens of
      (Token Numeral NumeralData{TNumeral.value = y1}:
       Token Numeral NumeralData{TNumeral.value = y2}:
       Token Numeral NumeralData{TNumeral.value = y3}:
       Token Numeral NumeralData{TNumeral.value = y4}:
       _) -> do
        let v = floor (y1 * 1000 + y2 * 100 + y3 * 10 + y4)
        tt $ year v
      _ -> Nothing
  }
ruleDurationAgo :: Rule
ruleDurationAgo = Rule
{ name = "<duration> ago"
@ -1154,6 +1297,7 @@ rules =
, ruleTheCycleAfterTime
, ruleTheCycleBeforeTime
, ruleTheDayAfterTomorrow
, ruleTwoDaysAfterTomorrow
, ruleTheDayBeforeYesterday
, ruleThisCycle
, ruleThisDayofweek
@ -1168,9 +1312,16 @@ rules =
, ruleTonight
, ruleWeekend
, ruleYearNumericWithYearSymbol
, ruleYearNumericWithYearSymbol2
, ruleYesterday
, ruleYyyymmdd
, ruleTimezone
, ruleRelativeMinutesAfterpastIntegerHourofday2
, ruleRelativeMinutesAfterpastIntegerHourofday3
, ruleRelativeMinutesAfterpastIntegerHourofday4
, ruleRelativeMinutesAfterpastIntegerHourofday5
, ruleRelativeMinutesAfterpastIntegerHourofday6
, ruleRelativeMinutesAfterpastIntegerHourofday7
]
++ ruleDaysOfWeek
++ ruleMonths

View File

@ -23,7 +23,7 @@ grains :: [(Text, String, TG.Grain)]
grains = [ ("second (grain)", "秒(钟|鐘)?", TG.Second)
, ("minute (grain)", "分(钟|鐘)?", TG.Minute)
, ("hour (grain)",
"小时|小時|鐘(\x982d)?", TG.Hour)
"小时|小時|個鐘|鐘(\x982d)?", TG.Hour)
, ("day (grain)", "天|日", TG.Day)
, ("week (grain)",
"周|週|礼拜|禮拜|星期", TG.Week)

View File

@ -378,6 +378,7 @@ library
, Duckling.Duration.UK.Corpus
, Duckling.Duration.UK.Rules
, Duckling.Duration.ZH.Corpus
, Duckling.Duration.ZH.Rules
, Duckling.Duration.Helpers
, Duckling.Duration.Rules
, Duckling.Duration.Types