Use a different set of benchmarks (#177)

This commit is contained in:
Mark Karpov 2017-01-29 03:30:16 +04:00 committed by GitHub
parent e63ac94df0
commit 1f58aa939f
5 changed files with 210 additions and 203 deletions

93
bench-memory/Main.hs Normal file
View File

@ -0,0 +1,93 @@
--
-- Weigh benchmarks for Megaparsec.
--
-- Copyright © 2015–2017 Megaparsec contributors
--
-- Redistribution and use in source and binary forms, with or without
-- modification, are permitted provided that the following conditions are
-- met:
--
-- * Redistributions of source code must retain the above copyright notice,
-- this list of conditions and the following disclaimer.
--
-- * Redistributions in binary form must reproduce the above copyright
-- notice, this list of conditions and the following disclaimer in the
-- documentation and/or other materials provided with the distribution.
--
-- THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS “AS IS” AND ANY
-- EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
-- WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-- DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDERS BE LIABLE FOR ANY
-- DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
-- DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
-- OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
-- HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
-- STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN
-- ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
-- POSSIBILITY OF SUCH DAMAGE.
module Main (main) where
import Control.DeepSeq
import Control.Monad
import Text.Megaparsec
import Text.Megaparsec.String
import Weigh
-- | Entry point: registers every measurement with Weigh via 'mainWith'.
--
-- Each entry gives 'bparser' a benchmark name, a function that builds the
-- input for a given size, and a function that builds the parser from the
-- @(input, size)@ pair.
main :: IO ()
main = mainWith . sequence_ $
  [ bparser "string"    manyAs      (\(s, _) -> string s)
  , bparser "string'"   manyAs      (\(s, _) -> string' s)
  , bparser "choice"    (\_ -> "b") (\(_, n) -> choice (map char (manyAsB n)))
  , bparser "many"      manyAs      (\_ -> many (char 'a'))
  , bparser "some"      manyAs      (\_ -> some (char 'a'))
  , bparser "count"     manyAs      ((\n -> count n (char 'a')) . snd)
  , bparser "count'"    manyAs      ((\n -> count' 1 n (char 'a')) . snd)
  , bparser "endBy"     manyAbs'    (\_ -> endBy (char 'a') (char 'b'))
  , bparser "endBy1"    manyAbs'    (\_ -> endBy1 (char 'a') (char 'b'))
  , bparser "sepBy"     manyAbs     (\_ -> sepBy (char 'a') (char 'b'))
  , bparser "sepBy1"    manyAbs     (\_ -> sepBy1 (char 'a') (char 'b'))
  , bparser "sepEndBy"  manyAbs'    (\_ -> sepEndBy (char 'a') (char 'b'))
  , bparser "sepEndBy1" manyAbs'    (\_ -> sepEndBy1 (char 'a') (char 'b'))
  , bparser "manyTill"  manyAsB     (\_ -> manyTill (char 'a') (char 'b'))
  , bparser "someTill"  manyAsB     (\_ -> someTill (char 'a') (char 'b'))
  ]
-- | Measure one parser at every size listed in 'stdSeries'.
--
-- For each size the input is built with the supplied generator, and a
-- 'func' measurement labelled @name/size@ is registered that runs the parser
-- over that input.
bparser :: NFData a
  => String            -- ^ Name of the benchmark group
  -> (Int -> String)   -- ^ How to construct input
  -> ((String, Int) -> Parser a) -- ^ The parser receiving its future input
  -> Weigh ()
bparser name f p = forM_ stdSeries measure
  where
    -- Register a single measurement for the given input size.
    measure size = func (name ++ "/" ++ show size) run (f size, size)
    -- Build the parser from the (input, size) pair and run it on the input.
    run (input, size) = parse (p (input, size)) "" input
-- | Input sizes used by 'bparser': four sizes, doubling from 500 up to 4000.
stdSeries :: [Int]
stdSeries = take 4 (iterate (* 2) 500)
----------------------------------------------------------------------------
-- Helpers
-- | Build a string consisting of the requested number of \'a\' characters.
manyAs :: Int -> String
manyAs = (`replicate` 'a')
-- | Alternating \'a\' and \'b\' characters, starting with \'a\'. An even
-- size is bumped by one, so for non-negative sizes the result ends in \'a\'.
manyAbs :: Int -> String
manyAbs n = take len (cycle "ab")
  where
    len
      | even n    = n + 1
      | otherwise = n
-- | The requested number of \'a\' characters followed by a single \'b\'.
manyAsB :: Int -> String
manyAsB len = replicate len 'a' ++ ['b']
-- | Alternating \'a\' and \'b\' characters, starting with \'a\'. An odd size
-- is bumped by one, so for positive sizes the result ends in \'b\'.
manyAbs' :: Int -> String
manyAbs' n = take len (cycle "ab")
  where
    len
      | even n    = n
      | otherwise = n + 1

93
bench-speed/Main.hs Normal file
View File

@ -0,0 +1,93 @@
--
-- Criterion benchmarks for Megaparsec.
--
-- Copyright © 2015–2017 Megaparsec contributors
--
-- Redistribution and use in source and binary forms, with or without
-- modification, are permitted provided that the following conditions are
-- met:
--
-- * Redistributions of source code must retain the above copyright notice,
-- this list of conditions and the following disclaimer.
--
-- * Redistributions in binary form must reproduce the above copyright
-- notice, this list of conditions and the following disclaimer in the
-- documentation and/or other materials provided with the distribution.
--
-- THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS “AS IS” AND ANY
-- EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
-- WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-- DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDERS BE LIABLE FOR ANY
-- DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
-- DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
-- OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
-- HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
-- STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN
-- ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
-- POSSIBILITY OF SUCH DAMAGE.
module Main (main) where
import Control.DeepSeq
import Criterion.Main
import Text.Megaparsec
import Text.Megaparsec.String
-- | Entry point: passes every benchmark group to Criterion's 'defaultMain'.
--
-- Each group is built by 'bparser' from a name, a function that builds the
-- input for a given size, and a function that builds the parser from the
-- @(input, size)@ pair.
main :: IO ()
main = defaultMain groups
  where
    groups =
      [ bparser "string"    manyAs      (\(input, _) -> string input)
      , bparser "string'"   manyAs      (\(input, _) -> string' input)
      , bparser "choice"    (\_ -> "b") (\(_, size) -> choice (map char (manyAsB size)))
      , bparser "many"      manyAs      (\_ -> many (char 'a'))
      , bparser "some"      manyAs      (\_ -> some (char 'a'))
      , bparser "count"     manyAs      ((\size -> count size (char 'a')) . snd)
      , bparser "count'"    manyAs      ((\size -> count' 1 size (char 'a')) . snd)
      , bparser "endBy"     manyAbs'    (\_ -> endBy (char 'a') (char 'b'))
      , bparser "endBy1"    manyAbs'    (\_ -> endBy1 (char 'a') (char 'b'))
      , bparser "sepBy"     manyAbs     (\_ -> sepBy (char 'a') (char 'b'))
      , bparser "sepBy1"    manyAbs     (\_ -> sepBy1 (char 'a') (char 'b'))
      , bparser "sepEndBy"  manyAbs'    (\_ -> sepEndBy (char 'a') (char 'b'))
      , bparser "sepEndBy1" manyAbs'    (\_ -> sepEndBy1 (char 'a') (char 'b'))
      , bparser "manyTill"  manyAsB     (\_ -> manyTill (char 'a') (char 'b'))
      , bparser "someTill"  manyAsB     (\_ -> someTill (char 'a') (char 'b'))
      ]
-- | Build a benchmark group that runs one parser at every size listed in
-- 'stdSeries'.
--
-- Each benchmark in the group is named after its size. The @(input, size)@
-- pair is supplied through 'env', and the parse result is evaluated with
-- 'nf'.
bparser :: NFData a
  => String            -- ^ Name of the benchmark group
  -> (Int -> String)   -- ^ How to construct input
  -> ((String, Int) -> Parser a) -- ^ The parser receiving its future input
  -> Benchmark         -- ^ The benchmark
bparser name f p = bgroup name (map benchFor stdSeries)
  where
    -- One benchmark for a single input size.
    benchFor size =
      env (return (f size, size)) $ \prepared ->
        bench (show size) (nf run prepared)
    -- Build the parser from the (input, size) pair and run it on the input.
    run (input, size) = parse (p (input, size)) "" input
-- | Input sizes used by 'bparser': 500, 1000, 2000 and 4000.
stdSeries :: [Int]
stdSeries = map (500 *) [1, 2, 4, 8]
----------------------------------------------------------------------------
-- Helpers
-- | Build a string consisting of the requested number of \'a\' characters.
manyAs :: Int -> String
manyAs = flip replicate 'a'
-- | The requested number of \'a\' characters followed by a single \'b\'.
manyAsB :: Int -> String
manyAsB = (++ "b") . flip replicate 'a'
-- | Alternating \'a\' and \'b\' characters, starting with \'a\'. The length
-- is rounded up to an odd number, so for non-negative sizes the result ends
-- in \'a\'.
manyAbs :: Int -> String
manyAbs n
  | even n    = alternating (n + 1)
  | otherwise = alternating n
  where
    alternating len = take len (cycle "ab")
-- | Alternating \'a\' and \'b\' characters, starting with \'a\'. The length
-- is rounded up to an even number, so for positive sizes the result ends in
-- \'b\'.
manyAbs' :: Int -> String
manyAbs' n
  | even n    = alternating n
  | otherwise = alternating (n + 1)
  where
    alternating len = take len (cycle "ab")

View File

@ -1,192 +0,0 @@
--
-- Criterion benchmarks for Megaparsec.
--
-- Copyright © 2015–2017 Megaparsec contributors
--
-- Redistribution and use in source and binary forms, with or without
-- modification, are permitted provided that the following conditions are
-- met:
--
-- * Redistributions of source code must retain the above copyright notice,
-- this list of conditions and the following disclaimer.
--
-- * Redistributions in binary form must reproduce the above copyright
-- notice, this list of conditions and the following disclaimer in the
-- documentation and/or other materials provided with the distribution.
--
-- THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS “AS IS” AND ANY
-- EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
-- WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-- DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDERS BE LIABLE FOR ANY
-- DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
-- DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
-- OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
-- HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
-- STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN
-- ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
-- POSSIBILITY OF SUCH DAMAGE.
{-# LANGUAGE CPP #-}
module Main (main) where
import Criterion.Main
import Text.Megaparsec
-- Configuration parameters.
-- To configure the benchmark, build the benchmarks e.g. like this:
-- $ cabal build --ghc-options="-DBENCHMARK_TYPE=3 -DBENCHMARK_STEPS=10"
-- BENCHMARK_TYPE options:
-- 0: Text.Megaparsec.String
-- 1: Text.Megaparsec.Text
-- 2: Text.Megaparsec.Text.Lazy
-- 3: Text.Megaparsec.ByteString
-- 4: Text.Megaparsec.ByteString.Lazy
#ifndef BENCHMARK_TYPE
#define BENCHMARK_TYPE 0
#endif
#if BENCHMARK_TYPE == 0
import Text.Megaparsec.String (Parser)
-- | Identity stand-in for @pack@, used when BENCHMARK_TYPE is 0 and the
-- input stream is a plain 'String'. The other BENCHMARK_TYPE branches import
-- a real @pack@ instead, so the benchmark code can call 'pack' uniformly.
pack :: String -> String
pack = id
#endif
#if BENCHMARK_TYPE == 1
import Text.Megaparsec.Text (Parser)
import Data.Text (pack)
#endif
#if BENCHMARK_TYPE == 2
import Text.Megaparsec.Text.Lazy (Parser)
import Data.Text.Lazy (pack)
#endif
#if BENCHMARK_TYPE == 3
import Text.Megaparsec.ByteString (Parser)
import Data.ByteString.Char8 (pack)
#endif
#if BENCHMARK_TYPE == 4
import Text.Megaparsec.ByteString.Lazy (Parser)
import Data.ByteString.Lazy.Char8 (pack)
#endif
-- benchSteps and benchSize control the benchmark test points: the benchmark
-- lists in this file enumerate the sizes
-- benchSize, benchSize*2 .. benchSize*benchSteps.
-- | Multiplier of 'benchSize' that bounds the enumerated sizes. Taken from
-- the BENCHMARK_STEPS macro when it is defined to a non-zero value,
-- otherwise 5.
benchSteps :: Int
#if BENCHMARK_STEPS
benchSteps = BENCHMARK_STEPS
#else
benchSteps = 5
#endif
-- | Smallest input size and the step between consecutive sizes. Taken from
-- the BENCHMARK_SIZE macro when it is defined to a non-zero value,
-- otherwise 1000.
benchSize :: Int
#if BENCHMARK_SIZE
benchSize = BENCHMARK_SIZE
#else
benchSize = 1000
#endif
-- End of configuration parameters
-- | Entry point: runs every group in 'benchmarks' through Criterion's
-- 'defaultMain'.
main :: IO ()
main = defaultMain benchmarks
-- | Every benchmark group run by 'main'.
--
-- Groups built with 'benchBunch' get @match@, @nomatch_early@ and
-- @nomatch_late@ sub-groups; the remaining groups use a single series of
-- sizes.
benchmarks :: [Benchmark]
benchmarks =
  [ -- Primitives come first.
    bgroup "string" (benchBunch (\len pat ->
      overAs len (string pat :: Parser String)))
  , bgroup "try-string" (benchBunch (\len pat ->
      overAs len (try (string pat) :: Parser String)))
  , bgroup "lookahead-string" (benchBunch (\len pat ->
      overAs len (lookAhead (string pat) :: Parser String)))
  , bgroup "notfollowedby-string" (benchBunch (\len pat ->
      overAs len (notFollowedBy (string pat) :: Parser ())))
  , bgroup "manual-string" benchManual
    -- Now for a few combinators
    -- Major class instance operators: return, >>=, <|>, mzero
    -- TODO
    -- I'm not really sure how to test these operators since I can't imagine
    -- what supraconstant complexity they might have.
    -- A few non-primitive combinators follow below
  , bgroup "choice"
      [ bgroup "match" (benchBunchMatch (\len _ ->
          overAs len
            (choice (replicate (len - 1) (char 'b') ++ [char 'a']) :: Parser Char)))
      , bgroup "nomatch" (benchBunchMatch (\len _ ->
          overAs len
            (choice (replicate len (char 'b')) :: Parser Char)))
      ]
  , bgroup "count'" benchCount
  , bgroup "sepBy1" benchSepBy1
  , bgroup "manyTill" (benchBunchNoMatchLate (\len _ ->
      parse
        (manyTill (char 'a') (char 'b') :: Parser String)
        ""
        (pack (replicate (len - 1) 'a' ++ "b"))))
  ]
  where
    -- Run the given parser over an input made of @len@ copies of \'a\'.
    overAs len parser = parse parser "" (pack (replicate len 'a'))
-- | Benchmarks for a hand-built equivalent of 'string': one 'char' parser
-- per expected character, sequenced together and run over an input of the
-- same length. One benchmark per size from 'benchSize' up to
-- @benchSize * benchSteps@.
benchManual :: [Benchmark]
benchManual =
  [ bench (show len) (whnf (parse parser "") input)
  | len <- [benchSize, benchSize * 2 .. benchSize * benchSteps]
  , let parser = sequence (fmap char (replicate len 'a')) :: Parser String
  , let input = pack (replicate len 'a')
  ]
-- | Benchmarks for @count'@. For each size the lower bound is 70% of the
-- size (rounded), the upper bound is twice the lower bound, and the input
-- is @size - 1@ copies of \'a\' followed by a \'b\'.
benchCount :: [Benchmark]
benchCount =
  [ bench (show len) (whnf (parse parser "") input)
  | len <- [benchSize, benchSize * 2 .. benchSize * benchSteps]
  , let lower = round ((0.7 :: Double) * fromIntegral len)
  , let parser = count' lower (lower * 2) (char 'a') :: Parser String
  , let input = pack (replicate (len - 1) 'a' ++ "b")
  ]
-- | Benchmarks for 'sepBy1' with \'a\' items separated by \'b\'. The input
-- for a given size is that many @"ab"@ pairs followed by @"ac"@.
benchSepBy1 :: [Benchmark]
benchSepBy1 =
  [ bench (show pairs) (whnf (parse parser "") (pack (genString pairs)))
  | pairs <- [benchSize, benchSize * 2 .. benchSize * benchSteps]
  , let parser = sepBy1 (char 'a') (char 'b') :: Parser String
  ]
  where
    -- Emit one "ab" pair per remaining count, then finish with "ac".
    genString i
      | i == 0    = "ac"
      | otherwise = 'a' : 'b' : genString (i - 1)
-- | Build the three standard sub-groups (@match@, @nomatch_early@,
-- @nomatch_late@) for a function taking a size and a string.
benchBunch :: (Int -> String -> b) -> [Benchmark]
benchBunch f =
  zipWith bgroup
    ["match", "nomatch_early", "nomatch_late"]
    [benchBunchMatch f, benchBunchNoMatchEarly f, benchBunchNoMatchLate f]
-- | One benchmark per size, applying the function to the size and to a
-- string of that many \'a\' characters. The result is evaluated with 'whnf'.
benchBunchMatch :: (Int -> String -> b) -> [Benchmark]
benchBunchMatch f =
  [ bench (show len) (whnf (f len) (replicate len 'a'))
  | len <- [benchSize, benchSize * 2 .. benchSize * benchSteps]
  ]
-- | One benchmark per size, applying the function to the size and to a
-- string of that many \'b\' characters. The result is evaluated with 'whnf'.
benchBunchNoMatchEarly :: (Int -> String -> b) -> [Benchmark]
benchBunchNoMatchEarly f =
  [ bench (show len) (whnf (f len) (replicate len 'b'))
  | len <- [benchSize, benchSize * 2 .. benchSize * benchSteps]
  ]
-- | One benchmark per size, applying the function to the size and to a
-- string of @size - 1@ \'a\' characters followed by a single \'b\'. The
-- result is evaluated with 'whnf'.
benchBunchNoMatchLate :: (Int -> String -> b) -> [Benchmark]
benchBunchNoMatchLate f =
  [ bench (show len) (whnf (f len) (replicate (len - 1) 'a' ++ "b"))
  | len <- [benchSize, benchSize * 2 .. benchSize * benchSteps]
  ]

View File

@ -50,6 +50,10 @@ extra-doc-files: AUTHORS.md
, CHANGELOG.md
, README.md
source-repository head
type: git
location: https://github.com/mrkkrp/megaparsec.git
flag dev
description: Turn on development settings.
manual: True
@ -139,21 +143,30 @@ test-suite tests
default-language: Haskell2010
benchmark benchmarks
benchmark bench-speed
main-is: Main.hs
hs-source-dirs: benchmarks
hs-source-dirs: bench-speed
type: exitcode-stdio-1.0
build-depends: base >= 4.6 && < 5.0
, criterion >= 0.6.2.1 && < 1.2
, deepseq >= 1.3 && < 1.5
, megaparsec >= 5.1.2
if flag(dev)
ghc-options: -O2 -Wall -Werror
else
ghc-options: -O2 -Wall
build-depends: base >= 4.6 && < 5.0
, bytestring >= 0.10 && < 0.11
, criterion >= 0.6.2.1 && < 1.2
, megaparsec >= 5.1.2
, text >= 0.2 && < 1.3
default-language: Haskell2010
source-repository head
type: git
location: https://github.com/mrkkrp/megaparsec.git
benchmark bench-memory
main-is: Main.hs
hs-source-dirs: bench-memory
type: exitcode-stdio-1.0
build-depends: base >= 4.6 && < 5.0
, deepseq >= 1.3 && < 1.5
, megaparsec >= 5.1.2
, weigh >= 0.0.3
if flag(dev)
ghc-options: -O2 -Wall -Werror
else
ghc-options: -O2 -Wall
default-language: Haskell2010

View File

@ -1,3 +1,3 @@
resolver: lts-7.14
resolver: lts-7.17
packages:
- '.'