1
1
mirror of https://github.com/github/semantic.git synced 2024-12-22 14:21:31 +03:00
semantic/src/TreeSitter.hs

89 lines
4.6 KiB
Haskell
Raw Normal View History

module TreeSitter where
import Diff
import Range
import Parser
import Term
2015-12-16 23:49:46 +03:00
import Control.Exception (bracket)
import qualified Data.Set as Set
import Foreign
import Foreign.C
import Foreign.C.Types
2015-12-15 21:29:58 +03:00
import qualified Data.Text as T
-- | Tag type for tree-sitter language grammars. In this module it only
-- appears as the target of a 'Ptr'.
data TSLanguage
  = TsLanguage
  deriving (Show, Eq)
-- | Grammar pointer exposed by the bridging header's @ts_language_c@ symbol;
-- 'languageForType' uses it for @.c@ and @.h@.
foreign import ccall "prototype/doubt-difftool/doubt-difftool-Bridging-Header.h ts_language_c"
  ts_language_c :: Ptr TSLanguage

-- | Grammar pointer exposed by the bridging header's
-- @ts_language_javascript@ symbol; 'languageForType' uses it for @.js@.
foreign import ccall "prototype/doubt-difftool/doubt-difftool-Bridging-Header.h ts_language_javascript"
  ts_language_javascript :: Ptr TSLanguage
-- | Tag type for tree-sitter documents. In this module it only appears as
-- the target of a 'Ptr' handed to the @ts_document_*@ imports.
data TSDocument
  = TsDocument
  deriving (Show, Eq)
-- | Binding to @ts_document_make@; yields the document handle that the other
-- @ts_document_*@ calls operate on.
foreign import ccall "prototype/External/tree-sitter/include/tree_sitter/runtime.h ts_document_make"
  ts_document_make :: IO (Ptr TSDocument)

-- | Binding to @ts_document_set_language@: associates a grammar with a
-- document.
foreign import ccall "prototype/External/tree-sitter/include/tree_sitter/runtime.h ts_document_set_language"
  ts_document_set_language :: Ptr TSDocument -> Ptr TSLanguage -> IO ()

-- | Binding to @ts_document_set_input_string@.
-- NOTE(review): presumably the document keeps referring to the C string
-- rather than copying it, so the string must outlive parsing — confirm
-- against runtime.h.
foreign import ccall "prototype/External/tree-sitter/include/tree_sitter/runtime.h ts_document_set_input_string"
  ts_document_set_input_string :: Ptr TSDocument -> CString -> IO ()

-- | Binding to @ts_document_parse@.
foreign import ccall "prototype/External/tree-sitter/include/tree_sitter/runtime.h ts_document_parse"
  ts_document_parse :: Ptr TSDocument -> IO ()

-- | Binding to @ts_document_free@; called once per document by
-- 'parseTreeSitterFile' when it is done with the handle.
foreign import ccall "prototype/External/tree-sitter/include/tree_sitter/runtime.h ts_document_free"
  ts_document_free :: Ptr TSDocument -> IO ()
-- | A length expressed both in bytes and in characters.
data TSLength = TsLength
  { bytes :: CSize
  , chars :: CSize
  }
  deriving (Show, Eq)
-- | Haskell-side description of a tree-sitter node: an untyped pointer plus
-- a 'TSLength' offset. The 'Storable' instance in this module refuses to
-- 'peek' or 'poke' it, so values of this type are only handled through
-- 'Ptr TSNode'.
data TSNode = TsNode
  { _data :: Ptr ()
  , offset :: TSLength
  }
  deriving (Show, Eq)
-- | Size and alignment information only, so that 'alloca' can reserve a
-- buffer for C code to fill in. Nodes are never marshalled to or from
-- Haskell values; 'peek' and 'poke' fail loudly if anyone tries.
instance Storable TSNode where
  -- The alignment used to be 24, which is not a power of two and therefore
  -- not a meaningful alignment request for 'alloca'. The struct's first field
  -- is a pointer, so pointer alignment is used instead.
  alignment _ = alignment (nullPtr :: Ptr ())
  -- NOTE(review): 24 presumably is one pointer plus two size_t on a 64-bit
  -- target — confirm against the C definition of TSNode.
  sizeOf _ = 24
  peek _ = error "Haskell code should never read TSNode values directly."
  poke _ _ = error "Haskell code should never write TSNode values directly."
-- | Bridge call taking a document and a caller-supplied node buffer;
-- 'documentToTerm' treats that buffer as the root node afterwards.
foreign import ccall "app/bridge.h ts_document_root_node_p"
  ts_document_root_node_p :: Ptr TSDocument -> Ptr TSNode -> IO ()

-- | Bridge call returning a node's name as a C string.
foreign import ccall "app/bridge.h ts_node_p_name"
  ts_node_p_name :: Ptr TSNode -> Ptr TSDocument -> IO CString

-- | Bridge call returning how many named children a node has.
foreign import ccall "app/bridge.h ts_node_p_named_child_count"
  ts_node_p_named_child_count :: Ptr TSNode -> IO CSize

-- | Bridge call taking a parent node, a child index and a caller-supplied
-- output buffer for the child. 'withNamedChildren' ignores the 'CSize'
-- result.
foreign import ccall "app/bridge.h ts_node_p_named_child"
  ts_node_p_named_child :: Ptr TSNode -> CSize -> Ptr TSNode -> IO CSize
2015-12-17 22:56:43 +03:00
-- | Start position of a node, as used for 'Range' construction in 'range'.
-- Imported as a pure function: the C call happens only when the result is
-- forced, so callers must force it while the node's storage is still valid.
foreign import ccall "app/bridge.h ts_node_p_start_char"
  ts_node_p_start_char :: Ptr TSNode -> CSize

-- | End position of a node; the same evaluation caveat as
-- 'ts_node_p_start_char' applies.
foreign import ccall "app/bridge.h ts_node_p_end_char"
  ts_node_p_end_char :: Ptr TSNode -> CSize
-- | A supported language: the tree-sitter grammar to parse with, paired with
-- the 'Constructor' used to build terms from the parsed nodes.
data Language = Language
  { getTsLanguage :: Ptr TSLanguage
  , getConstructor :: Constructor
  }
-- | Select the 'Language' for a file extension (including the leading dot).
-- @.h@ and @.c@ map to C, @.js@ maps to JavaScript, and anything else yields
-- 'Nothing'.
languageForType :: String -> Maybe Language
languageForType mediaType
  | mediaType `elem` [".h", ".c"] = Just cLanguage
  | mediaType == ".js" = Just javaScriptLanguage
  | otherwise = Nothing
  where
    cLanguage =
      Language ts_language_c (constructorForProductions mempty cProductions)
    cProductions =
      Set.fromList [ "assignment_expression", "logical_expression", "pointer_expression", "field_expression", "relational_expression", "designator", "call_expression", "math_expression" ]
    javaScriptLanguage =
      Language
        ts_language_javascript
        (constructorForProductions javaScriptFirstProductions javaScriptSecondProductions)
    -- First and second production sets passed to 'constructorForProductions'.
    javaScriptFirstProductions =
      Set.fromList [ "object" ]
    javaScriptSecondProductions =
      Set.fromList [ "pair", "rel_op", "math_op", "bool_op", "bitwise_op", "type_op", "math_assignment", "assignment", "subscript_access", "member_access", "new_expression", "function_call", "function", "ternary" ]
-- | Build a 'Parser' that parses source text with the given language's
-- tree-sitter grammar and converts the result into a term using the
-- language's constructor.
--
-- The document is acquired and released with 'bracket', so it is freed even
-- if parsing or term construction throws. It is released inside the
-- 'withCString' scope, i.e. while the marshalled source buffer still exists,
-- as in the original ordering of the free.
parseTreeSitterFile :: Language -> Parser
parseTreeSitterFile (Language language constructor) contents =
  withCString (T.unpack contents) $ \source ->
    bracket ts_document_make ts_document_free $ \document -> do
      ts_document_set_language document language
      ts_document_set_input_string document source
      ts_document_parse document
      documentToTerm constructor document contents
-- | Convert a parsed document into a term by walking its named nodes from
-- the root. Each node becomes a term built by @constructor@ from the source
-- text, an 'Info' carrying the node's range and name, and its named
-- children.
documentToTerm :: Constructor -> Ptr TSDocument -> Parser
documentToTerm constructor document contents = alloca $ \root -> do
  ts_document_root_node_p document root
  snd <$> toTerm root
  where
    -- Produces the node's name alongside its term.
    toTerm :: Ptr TSNode -> IO (T.Text, Term T.Text Info)
    toTerm node = do
      cName <- ts_node_p_name node document
      name <- T.pack <$> peekCString cName
      children <- withNamedChildren node toTerm
      let nodeRange = range node
      -- The forcing here is semantically important. 'range' reads through
      -- @node@ lazily, and @node@ points into an 'alloca' buffer that is
      -- released once the enclosing scope exits. Without forcing both fields
      -- now, the reads could happen after the buffer is gone.
      start nodeRange `seq` end nodeRange `seq`
        return (name, constructor contents (Info nodeRange $ Set.singleton name) children)
2015-12-15 21:29:58 +03:00
-- | Apply an action to every named child of a node, in index order, and
-- collect the results. Each child is written into its own temporary buffer,
-- which is only valid while the action for that child runs.
withNamedChildren :: Ptr TSNode -> (Ptr TSNode -> IO (T.Text, a)) -> IO [(T.Text, a)]
withNamedChildren node transformNode = do
  childCount <- ts_node_p_named_child_count node
  mapM visitChild (childIndices childCount)
  where
    -- 'CSize' is unsigned, so the empty case is handled separately rather
    -- than computing @0 - 1@.
    childIndices 0 = []
    childIndices total = [0 .. total - 1]
    visitChild index = alloca $ \child -> do
      _ <- ts_node_p_named_child node index child
      transformNode child
2015-12-17 22:56:43 +03:00
-- | The character range covered by a node. Both bounds are read through the
-- node pointer only when they are forced, so the result must be evaluated
-- while the pointer is still valid.
range :: Ptr TSNode -> Range
range node = Range { start = startChar, end = endChar }
  where
    startChar = fromIntegral (ts_node_p_start_char node)
    endChar = fromIntegral (ts_node_p_end_char node)