1
1
mirror of https://github.com/github/semantic.git synced 2025-01-02 12:23:08 +03:00
semantic/src/Algorithm.hs

196 lines
8.7 KiB
Haskell
Raw Normal View History

2017-09-18 07:23:14 +03:00
{-# LANGUAGE DataKinds, DefaultSignatures, GADTs, RankNTypes, TypeOperators, UndecidableInstances #-}
2015-11-18 03:20:52 +03:00
module Algorithm where
2015-11-18 03:24:01 +03:00
import Control.Applicative (Alternative(..))
import Control.Monad (guard)
2017-09-09 13:23:57 +03:00
import Control.Monad.Free.Freer
import Data.Functor.Classes
import Data.List.NonEmpty (NonEmpty(..))
2017-07-28 21:37:02 +03:00
import Data.Maybe
import Data.Proxy
import Data.These
2017-07-21 00:15:01 +03:00
import Data.Union
import Diff
import GHC.Generics
import Term
2016-08-04 01:12:31 +03:00
2017-02-21 18:26:27 +03:00
-- | A single step in a diffing algorithm, parameterized by the types of terms, diffs, and the result of the applicable algorithm.
2017-09-14 22:17:22 +03:00
data AlgorithmF term diff result where
-- | Diff two terms with the choice of algorithm left to the interpreters discretion.
2017-09-14 22:17:22 +03:00
Diff :: term ann1 -> term ann2 -> AlgorithmF term (diff ann1 ann2) (diff ann1 ann2)
2017-02-21 18:38:10 +03:00
-- | Diff two terms recursively in O(n) time, resulting in a single diff node.
2017-09-14 22:17:22 +03:00
Linear :: term ann1 -> term ann2 -> AlgorithmF term (diff ann1 ann2) (diff ann1 ann2)
2017-02-21 18:38:10 +03:00
-- | Diff two lists of terms by each elements similarity in O(n³ log n), resulting in a list of diffs.
2017-09-14 22:17:22 +03:00
RWS :: [term ann1] -> [term ann2] -> AlgorithmF term (diff ann1 ann2) [diff ann1 ann2]
2017-09-19 17:02:26 +03:00
-- | Delete a term.
2017-09-14 22:17:22 +03:00
Delete :: term ann1 -> AlgorithmF term (diff ann1 ann2) (diff ann1 ann2)
-- | Insert a term.
2017-09-14 22:17:22 +03:00
Insert :: term ann2 -> AlgorithmF term (diff ann1 ann2) (diff ann1 ann2)
-- | Replace one term with another.
2017-09-14 22:17:22 +03:00
Replace :: term ann1 -> term ann2 -> AlgorithmF term (diff ann1 ann2) (diff ann1 ann2)
2017-09-19 14:21:31 +03:00
-- | An 'Algorithm' that always fails.
Empty :: AlgorithmF term diff a
2017-09-19 14:21:31 +03:00
-- | An 'Algorithm' to try one of two alternatives.
Alt :: a -> a -> AlgorithmF term diff a
2017-09-19 17:52:47 +03:00
-- | The free(r) monad for 'AlgorithmF'. This enables us to construct algorithms to diff using '<$>', '<*>', '>>=', and do-notation.
2017-09-14 22:17:22 +03:00
type Algorithm term diff = Freer (AlgorithmF term diff)
2016-08-04 19:08:34 +03:00
-- DSL
-- | Diff two terms without specifying the algorithm to be used.
2017-09-14 22:17:22 +03:00
diff :: term ann1 -> term ann2 -> Algorithm term (diff ann1 ann2) (diff ann1 ann2)
2017-09-09 13:23:57 +03:00
diff = (liftF .) . Algorithm.Diff
2017-02-23 20:30:26 +03:00
-- | Diff a These of terms without specifying the algorithm to be used.
2017-09-14 22:17:22 +03:00
diffThese :: These (term ann1) (term ann2) -> Algorithm term (diff ann1 ann2) (diff ann1 ann2)
diffThese = these byDeleting byInserting diff
-- | Diff a pair of optional terms without specifying the algorithm to be used.
2017-09-14 22:17:22 +03:00
diffMaybe :: Maybe (term ann1) -> Maybe (term ann2) -> Algorithm term (diff ann1 ann2) (Maybe (diff ann1 ann2))
diffMaybe (Just a) (Just b) = Just <$> diff a b
diffMaybe (Just a) _ = Just <$> byDeleting a
diffMaybe _ (Just b) = Just <$> byInserting b
diffMaybe _ _ = pure Nothing
-- | Diff two terms linearly.
2017-09-14 22:17:22 +03:00
linearly :: term ann1 -> term ann2 -> Algorithm term (diff ann1 ann2) (diff ann1 ann2)
linearly a b = liftF (Linear a b)
-- | Diff two terms using RWS.
2017-09-14 22:17:22 +03:00
byRWS :: [term ann1] -> [term ann2] -> Algorithm term (diff ann1 ann2) [diff ann1 ann2]
byRWS a b = liftF (RWS a b)
-- | Delete a term.
2017-09-14 22:17:22 +03:00
byDeleting :: term ann1 -> Algorithm term (diff ann1 ann2) (diff ann1 ann2)
byDeleting = liftF . Delete
-- | Insert a term.
2017-09-14 22:17:22 +03:00
byInserting :: term ann2 -> Algorithm term (diff ann1 ann2) (diff ann1 ann2)
byInserting = liftF . Insert
-- | Replace one term with another.
2017-09-14 22:17:22 +03:00
byReplacing :: term ann1 -> term ann2 -> Algorithm term (diff ann1 ann2) (diff ann1 ann2)
byReplacing = (liftF .) . Replace
2017-09-14 22:17:22 +03:00
instance (Show1 term, Show ann1, Show ann2) => Show1 (AlgorithmF term (diff ann1 ann2)) where
liftShowsPrec sp _ d algorithm = case algorithm of
2017-09-14 01:59:38 +03:00
Algorithm.Diff t1 t2 -> showsBinaryWith showsTerm showsTerm "Diff" d t1 t2
Linear t1 t2 -> showsBinaryWith showsTerm showsTerm "Linear" d t1 t2
RWS as bs -> showsBinaryWith (liftShowsPrec showsTerm (liftShowList showsPrec showList)) (liftShowsPrec showsTerm (liftShowList showsPrec showList)) "RWS" d as bs
Delete t1 -> showsUnaryWith showsTerm "Delete" d t1
Insert t2 -> showsUnaryWith showsTerm "Insert" d t2
Replace t1 t2 -> showsBinaryWith showsTerm showsTerm "Replace" d t1 t2
Empty -> showString "Empty"
Alt a b -> showsBinaryWith sp sp "Alt" d a b
2017-09-14 22:08:43 +03:00
where showsTerm :: (Show1 term, Show ann) => Int -> term ann -> ShowS
2017-09-14 01:59:38 +03:00
showsTerm = liftShowsPrec showsPrec showList
2017-07-21 00:15:01 +03:00
instance Alternative (Algorithm term diff) where
empty = Empty `Then` return
2017-09-19 15:23:33 +03:00
(Empty `Then` _) <|> b = b
a <|> (Empty `Then` _) = a
a <|> b = Alt a b `Then` id
2017-07-21 03:21:20 +03:00
-- | Diff two terms based on their generic Diffable instances. If the terms are not diffable
-- (represented by a Nothing diff returned from algorithmFor) replace one term with another.
algorithmForTerms :: Diffable syntax
=> Term syntax ann1
-> Term syntax ann2
2017-09-14 22:17:22 +03:00
-> Algorithm (Term syntax) (Diff syntax ann1 ann2) (Diff syntax ann1 ann2)
algorithmForTerms (Term (In ann1 f1)) (Term (In ann2 f2)) = merge (ann1, ann2) <$> algorithmFor f1 f2
2017-07-21 00:15:01 +03:00
2017-07-21 03:21:20 +03:00
-- | A type class for determining what algorithm to use for diffing two terms.
2017-07-21 00:15:01 +03:00
class Diffable f where
algorithmFor :: f (term ann1)
-> f (term ann2)
-> Algorithm term (diff ann1 ann2) (f (diff ann1 ann2))
default
algorithmFor :: (Generic1 f, GDiffable (Rep1 f))
=> f (term ann1)
-> f (term ann2)
-> Algorithm term (diff ann1 ann2) (f (diff ann1 ann2))
algorithmFor = genericAlgorithmFor
2017-09-19 21:02:08 +03:00
subalgorithmFor :: (a -> Algorithm term (diff ann1 ann2) b)
-> (a -> Algorithm term (diff ann1 ann2) b)
-> f a
-> Algorithm term (diff ann1 ann2) (f b)
default
subalgorithmFor :: Traversable f
=> (a -> Algorithm term (diff ann1 ann2) b)
-> (a -> Algorithm term (diff ann1 ann2) b)
-> f a
-> Algorithm term (diff ann1 ann2) (f b)
subalgorithmFor _ _ _ = empty
genericAlgorithmFor :: (Generic1 f, GDiffable (Rep1 f)) => f (term ann1) -> f (term ann2) -> Algorithm term (diff ann1 ann2) (f (diff ann1 ann2))
genericAlgorithmFor a b = to1 <$> galgorithmFor (from1 a) (from1 b)
2017-07-21 00:15:01 +03:00
2017-07-21 03:25:27 +03:00
-- | Diff a Union of Syntax terms. Left is the "rest" of the Syntax terms in the Union,
2017-07-21 20:50:53 +03:00
-- Right is the "head" of the Union. 'weaken' relaxes the Union to allow the possible
-- diff terms from the "rest" of the Union, and 'inj' adds the diff terms into the Union.
2017-07-21 03:21:20 +03:00
-- NB: If Left or Right Syntax terms in our Union don't match, we fail fast by returning Nothing.
2017-09-18 07:23:14 +03:00
instance Apply Diffable fs => Diffable (Union fs) where
algorithmFor u1 u2 = fromMaybe empty (apply2' (Proxy :: Proxy Diffable) (\ inj f1 f2 -> inj <$> algorithmFor f1 f2) u1 u2)
2017-07-21 00:15:01 +03:00
2017-09-19 21:02:08 +03:00
subalgorithmFor blur focus = apply' (Proxy :: Proxy Diffable) (\ inj f1 -> inj <$> subalgorithmFor blur focus f1)
2017-09-19 19:49:34 +03:00
-- | Diff two 'Maybe's.
instance Diffable Maybe where
algorithmFor = diffMaybe
2017-09-19 19:49:34 +03:00
-- | Diff two lists using RWS.
2017-07-21 20:50:24 +03:00
instance Diffable [] where
algorithmFor a b = byRWS a b
2017-07-21 20:50:24 +03:00
-- | Diff two non-empty lists using RWS.
instance Diffable NonEmpty where
algorithmFor (a:|as) (b:|bs) = (\ (d:ds) -> d:|ds) <$> byRWS (a:as) (b:bs)
2017-07-21 03:21:20 +03:00
-- | A generic type class for diffing two terms defined by the Generic1 interface.
class GDiffable f where
galgorithmFor :: f (term ann1) -> f (term ann2) -> Algorithm term (diff ann1 ann2) (f (diff ann1 ann2))
2017-07-21 00:15:01 +03:00
2017-07-21 20:50:53 +03:00
-- | Diff two constructors (M1 is the Generic1 newtype for meta-information (possibly related to type constructors, record selectors, and data types))
instance GDiffable f => GDiffable (M1 i c f) where
galgorithmFor (M1 a) (M1 b) = M1 <$> galgorithmFor a b
2017-07-21 00:15:01 +03:00
2017-07-21 20:50:53 +03:00
-- | Diff the fields of a product type.
-- i.e. data Foo a b = Foo a b (the 'Foo a b' is captured by 'a :*: b').
instance (GDiffable f, GDiffable g) => GDiffable (f :*: g) where
galgorithmFor (a1 :*: b1) (a2 :*: b2) = (:*:) <$> galgorithmFor a1 a2 <*> galgorithmFor b1 b2
2017-07-21 00:15:01 +03:00
2017-07-21 20:50:53 +03:00
-- | Diff the constructors of a sum type.
-- i.e. data Foo a = Foo a | Bar a (the 'Foo a' is captured by L1 and 'Bar a' is R1).
instance (GDiffable f, GDiffable g) => GDiffable (f :+: g) where
galgorithmFor (L1 a) (L1 b) = L1 <$> galgorithmFor a b
galgorithmFor (R1 a) (R1 b) = R1 <$> galgorithmFor a b
galgorithmFor _ _ = empty
2017-07-21 00:15:01 +03:00
2017-07-21 03:21:20 +03:00
-- | Diff two parameters (Par1 is the Generic1 newtype representing a type parameter).
2017-07-21 20:50:53 +03:00
-- i.e. data Foo a = Foo a (the 'a' is captured by Par1).
instance GDiffable Par1 where
galgorithmFor (Par1 a) (Par1 b) = Par1 <$> linearly a b
2017-07-21 00:15:01 +03:00
2017-07-21 03:21:20 +03:00
-- | Diff two constant parameters (K1 is the Generic1 newtype representing type parameter constants).
2017-07-21 20:50:53 +03:00
-- i.e. data Foo = Foo Int (the 'Int' is a constant parameter).
instance Eq c => GDiffable (K1 i c) where
galgorithmFor (K1 a) (K1 b) = guard (a == b) *> pure (K1 a)
2017-07-21 00:15:01 +03:00
2017-07-21 03:21:20 +03:00
-- | Diff two terms whose constructors contain 0 type parameters.
-- i.e. data Foo = Foo.
instance GDiffable U1 where
galgorithmFor _ _ = pure U1
2017-07-21 00:15:01 +03:00
-- | Diff two 'Diffable' containers of parameters.
instance Diffable f => GDiffable (Rec1 f) where
galgorithmFor a b = Rec1 <$> algorithmFor (unRec1 a) (unRec1 b)