1
1
mirror of https://github.com/github/semantic.git synced 2025-01-08 08:30:27 +03:00
semantic/src/Source.hs

118 lines
4.7 KiB
Haskell
Raw Normal View History

{-# LANGUAGE GeneralizedNewtypeDeriving #-}
{-# OPTIONS_GHC -funbox-strict-fields #-}
2015-12-24 06:38:02 +03:00
module Source where
import Prologue hiding (uncons)
import Data.Text (unpack, pack)
import Data.String
import qualified Data.Vector as Vector
2016-03-08 03:20:28 +03:00
import Numeric
import Range
import SourceSpan
2016-07-29 20:03:11 +03:00
-- | The source, oid, path, and Maybe SourceKind of a blob in a Git repo.
data SourceBlob = SourceBlob { source :: Source Char, oid :: String, path :: FilePath, blobKind :: Maybe SourceKind }
deriving (Show, Eq)
-- | The contents of a source file, backed by a vector for efficient slicing.
newtype Source a = Source { getVector :: Vector.Vector a }
deriving (Eq, Show, Foldable, Functor, Traversable)
-- | The kind of a blob, along with it's file mode.
2016-03-08 03:20:28 +03:00
data SourceKind = PlainBlob Word32 | ExecutableBlob Word32 | SymlinkBlob Word32
2016-03-08 02:50:32 +03:00
deriving (Show, Eq)
2016-03-04 00:29:03 +03:00
2016-03-04 01:09:46 +03:00
modeToDigits :: SourceKind -> String
2016-03-08 03:20:28 +03:00
modeToDigits (PlainBlob mode) = showOct mode ""
modeToDigits (ExecutableBlob mode) = showOct mode ""
modeToDigits (SymlinkBlob mode) = showOct mode ""
2016-03-04 01:09:46 +03:00
2016-01-27 00:25:40 +03:00
2016-03-09 00:04:44 +03:00
-- | The default plain blob mode
defaultPlainBlob :: SourceKind
defaultPlainBlob = PlainBlob 0o100644
emptySourceBlob :: FilePath -> SourceBlob
emptySourceBlob filepath = SourceBlob (Source.fromList "") Source.nullOid filepath Nothing
sourceBlob :: Source Char -> FilePath -> SourceBlob
sourceBlob source filepath = SourceBlob source Source.nullOid filepath (Just defaultPlainBlob)
-- | Map blobs with Nothing blobKind to empty blobs.
idOrEmptySourceBlob :: SourceBlob -> SourceBlob
2016-06-02 00:41:28 +03:00
idOrEmptySourceBlob blob = if isNothing (blobKind blob)
then blob { oid = nullOid, blobKind = Nothing }
else blob
nullOid :: String
nullOid = "0000000000000000000000000000000000000000"
2016-01-13 23:50:52 +03:00
-- | Return a Source from a list of items.
2015-12-24 07:37:51 +03:00
fromList :: [a] -> Source a
fromList = Source . Vector.fromList
2016-01-13 23:50:52 +03:00
-- | Return a Source of Chars from a Text.
fromText :: Text -> Source Char
fromText = Source . Vector.fromList . unpack
2015-12-30 01:34:52 +03:00
2016-01-13 23:50:52 +03:00
-- | Return a Source that contains a slice of the given Source.
2015-12-24 07:25:00 +03:00
slice :: Range -> Source a -> Source a
2016-01-12 19:56:36 +03:00
slice range = Source . Vector.slice (start range) (rangeLength range) . getVector
2016-01-13 23:50:52 +03:00
-- | Return a String with the contents of the Source.
toString :: Source Char -> String
2015-12-24 07:26:37 +03:00
toString = toList
-- | Return a text with the contents of the Source.
toText :: Source Char -> Text
toText = pack . toList
2016-01-13 23:50:52 +03:00
-- | Return the item at the given index.
at :: Source a -> Int -> a
2015-12-24 07:29:27 +03:00
at = (Vector.!) . getVector
2016-01-13 23:50:52 +03:00
-- | Remove the first item and return it with the rest of the source.
2015-12-24 07:05:01 +03:00
uncons :: Source a -> Maybe (a, Source a)
uncons (Source vector) = if null vector then Nothing else Just (Vector.head vector, Source $ Vector.tail vector)
2015-12-24 07:16:09 +03:00
2016-01-13 23:50:52 +03:00
-- | Split the source into the longest prefix of elements that do not satisfy the predicate and the rest without copying.
2015-12-24 07:16:09 +03:00
break :: (a -> Bool) -> Source a -> (Source a, Source a)
2015-12-24 07:23:16 +03:00
break predicate (Source vector) = let (start, remainder) = Vector.break predicate vector in (Source start, Source remainder)
2015-12-24 07:41:08 +03:00
2016-01-14 00:20:29 +03:00
-- | Split the contents of the source after newlines.
actualLines :: Source Char -> [Source Char]
actualLines source | null source = [ source ]
actualLines source = case Source.break (== '\n') source of
(l, lines') -> case uncons lines' of
Nothing -> [ l ]
2016-09-13 18:45:30 +03:00
Just (_, lines') -> (l <> fromList "\n") : actualLines lines'
-- | Compute the line ranges within a given range of a string.
actualLineRanges :: Range -> Source Char -> [Range]
actualLineRanges range = drop 1 . scanl toRange (Range (start range) (start range)) . actualLines . slice range
where toRange previous string = Range (end previous) $ end previous + length string
2016-05-21 05:38:55 +03:00
2016-10-06 00:27:45 +03:00
-- | Compute the character range given a Source and a SourceSpan.
sourceSpanToRange :: Source Char -> SourceSpan -> Range
2016-09-13 19:23:47 +03:00
sourceSpanToRange source SourceSpan{..} = Range start end
2016-09-13 19:25:55 +03:00
where start = sumLengths leadingRanges + column spanStart
end = start + sumLengths (take (line spanEnd - line spanStart) remainingRanges) + (column spanEnd - column spanStart)
2016-09-13 19:23:47 +03:00
(leadingRanges, remainingRanges) = splitAt (line spanStart) (actualLineRanges (totalRange source) source)
2016-09-13 19:25:55 +03:00
sumLengths = sum . fmap (\ Range{..} -> end - start)
2016-10-11 22:09:24 +03:00
rangeToSourceSpan :: Source Char -> Range -> SourceSpan
rangeToSourceSpan source range@Range{} = SourceSpan startPos endPos
where startPos = maybe (SourcePos 1 1) (toStartPos 1) (head lineRanges)
2016-12-02 00:03:45 +03:00
endPos = toEndPos (length lineRanges) (fromMaybe (rangeAt 0) (snd <$> unsnoc lineRanges))
2016-10-06 00:27:45 +03:00
lineRanges = actualLineRanges range source
toStartPos line range = SourcePos line (start range)
toEndPos line range = SourcePos line (end range)
2016-05-21 05:38:55 +03:00
2016-09-18 03:54:07 +03:00
instance Semigroup (Source a) where
Source a <> Source b = Source (a Vector.++ b)
2016-05-21 05:38:55 +03:00
instance Monoid (Source a) where
mempty = fromList []
2016-09-18 03:54:07 +03:00
mappend = (<>)