tock-mirror/common/FlowGraph.hs

{-
Tock: a compiler for parallel languages
Copyright (C) 2007  University of Kent

This program is free software; you can redistribute it and/or modify it
under the terms of the GNU General Public License as published by the
Free Software Foundation, either version 2 of the License, or (at your
option) any later version.

This program is distributed in the hope that it will be useful, but
WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
General Public License for more details.

You should have received a copy of the GNU General Public License along
with this program.  If not, see <http://www.gnu.org/licenses/>.
-}


-- | The module for building control-flow graphs.  Most statements are merely processed as-is (one statement becomes one node).
-- The only cases of interest are the control structures.
--
-- * Seq blocks are merely strung together with ESeq edges.
--
-- * Par blocks have a dummy begin and end node.  The begin node has outgoing links
-- to all the members (EStartPar n), and the end nodes of each of the members has
-- a link (EEndPar n) back to the the dummy end node.  Thus all the par members thread
-- back through the same common node at the end.
--
-- * While loops have a condition node representing the test-expression.  This condition node
-- has an ESeq link out to the body of the while loop, and there is an ESeq link back from the
-- end of the while loop to the condition node.  It is the condition node that is linked
-- to nodes before and after it.
--
-- * Case statements have a slight optimisation.  Technically, the cases are examined in some
-- (probably undefined) order, with an Else option coming last.  But since the expressions
-- to check against are constant, I have chosen to represent case statements as follows:
-- There is a dummy begin node with the test-expression.  This has ESeq links to all possible options.
-- The end of each option links back to a dummy end node.
--
-- * If statements, on the other hand, have to be chained together.  Each expression is connected
-- to its body, but also to the next expression.  There is no link between the last expression
-- and the end of the if; if statements behave like STOP if nothing is matched.
module FlowGraph (EdgeLabel(..), FNode(..), FlowGraph, GraphLabelFuncs(..), buildFlowGraph, makeFlowGraphInstr) where

import Control.Monad.Error
import Control.Monad.State
import Data.Generics
import Data.Graph.Inductive

import qualified AST as A
import Metadata
import TreeUtil
import Utils

-- | A node will either have zero links out, one or more Seq links, or one or more Par links.
-- Zero links means it is a terminal node.
-- One Seq link means a normal sequential progression.
-- Multiple Seq links means choice.
-- Multiple Par links means a parallel branch.  All outgoing par links should have the same identifier,
-- and this identifier is unique and matches a later endpar link
data EdgeLabel = ESeq | EStartPar Int | EEndPar Int deriving (Show, Eq, Ord)

--If is (previous condition) (final node)
data OuterType = None | Seq | Par | Case (Node,Node) | If Node Node

newtype FNode a = Node (Meta, a)
--type FEdge = (Node, EdgeLabel, Node)

instance Show a => Show (FNode a) where
  show (Node (m,x)) = (filter ((/=) '\"')) $ show m ++ ":" ++ show x

type FlowGraph a = Gr (FNode a) EdgeLabel

type NodesEdges a = ([LNode (FNode a)],[LEdge EdgeLabel])

type GraphMaker m a b = ErrorT String (StateT (Node, Int, NodesEdges a) m) b

data Monad m => GraphLabelFuncs m label = GLF {
     labelDummy :: Meta -> m label
    ,labelProcess :: A.Process -> m label
    ,labelExpression :: A.Expression -> m label
    ,labelExpressionList :: A.ExpressionList -> m label
    ,labelScopeIn :: A.Specification -> m label
    ,labelScopeOut :: A.Specification -> m label
  }

-- | Builds the instructions to send to GraphViz
makeFlowGraphInstr :: Show a => FlowGraph a -> String
makeFlowGraphInstr = graphviz'

-- The primary reason for having the blank generator take a Meta as an argument is actually for testing.  But other uses can simply ignore it if they want.
buildFlowGraph :: Monad m => GraphLabelFuncs m a -> A.Structured -> m (Either String (FlowGraph a))
buildFlowGraph funcs s
  = do res <- runStateT (runErrorT $ buildStructured None s) (0, 0, ([],[]) )
       return $ case res of
                  (Left err,_) -> Left err
                  (_,(_,_,(nodes, edges))) -> Right (mkGraph nodes edges)
  where
    -- All the functions return the new graph, and the identifier of the node just added

-- Type commented out because it's not technically correct, but looks right to me:
--    run :: Monad m => (GraphLabelFuncs m a -> (b -> m a)) -> b -> m a
    run func = func funcs

    addNode :: Monad m => (Meta, a) -> GraphMaker m a Node
    addNode x = do (n,pi,(nodes, edges)) <- get
                   put (n+1, pi,((n, Node x):nodes, edges))
                   return n

    addEdge :: Monad m => EdgeLabel -> Node -> Node -> GraphMaker m a ()
    addEdge label start end = do (n, pi, (nodes, edges)) <- get
                                 put (n + 1, pi, (nodes,(start, end, label):edges))

-- Type commented out because it's not technically correct, but looks right to me:
--    addNode' :: Monad m => Meta -> (GraphLabelFuncs m a -> (b -> m a)) -> b -> GraphMaker m a Node
    addNode' m f t = do val <- (lift . lift) (run f t)
                        addNode (m, val)

-- Type commented out because it's not technically correct, but looks right to me:
--    addDummyNode :: Meta -> GraphMaker m a Node
    addDummyNode m = addNode' m labelDummy m

    addParEdges :: Monad m => Node -> Node -> [(Node,Node)] -> GraphMaker m a ()
    addParEdges s e pairs = do (n,pi,(nodes,edges)) <- get
                               put (n,pi+1,(nodes,edges ++ (concatMap (parEdge pi) pairs)))
      where
        parEdge :: Int -> (Node, Node) -> [LEdge EdgeLabel]
        parEdge id (a,z) = [(s,a,(EStartPar id)),(z,e,(EEndPar id))]

    -- Returns a pair of beginning-node, end-node
-- Type commented out because it's not technically correct, but looks right to me:
--    buildStructured :: OuterType -> A.Structured -> GraphMaker m a (Node, Node)
    buildStructured outer (A.Several m ss)
      = do case outer of
             None -> -- If there is no context, they should be left as disconnected graphs.
                     do nodes <- mapM (buildStructured outer) ss
                        n <- addDummyNode m
                        return (n, n)
             Seq -> do nodes <- mapM (buildStructured outer) ss
                       sequence_ $ mapPairs (\(_,s) (e,_) -> addEdge ESeq s e) nodes
                       case nodes of
                         [] -> do n <- addDummyNode m
                                  return (n,n)
                         _ -> return (fst (head nodes), snd (last nodes))
             Par -> do nodes <- mapM (buildStructured outer) ss
                       case nodes of
                         [] -> do n <- addDummyNode m
                                  return (n,n)
                         [(s,e)] -> return (s,e)
                         _ -> do
                           nStart <- addDummyNode m
                           nEnd <- addDummyNode m
                           addParEdges nStart nEnd nodes
                           return (nStart, nEnd)
             --Because the conditions in If statements are chained together, we
             --must fold the specs, not map them independently
             If prev end -> foldM foldIf (prev,end) ss
               where
                 -- Type commented out because it's not technically correct, but looks right to me:
                 -- foldIf :: (Node,Node) -> A.Structured -> GraphMaker m a (Node, Node)
                 foldIf (prev,end) s = do (prev',_) <- buildStructured (If prev end) s
                                          return (prev', end)
             _ -> do nodes <- mapM (buildStructured outer) ss
                     return (-1,-1)
    buildStructured _ (A.OnlyP _ p) = buildProcess p
    buildStructured outer (A.OnlyC _ (A.Choice m exp p))
      = do nexp <- addNode' m labelExpression exp
           (nbodys, nbodye) <- buildProcess p
           addEdge ESeq nexp nbodys
           case outer of
             If cPrev cEnd ->
               do addEdge ESeq cPrev nexp
                  addEdge ESeq nbodye cEnd
             _ -> throwError "Choice found outside IF statement"
           return (nexp,nbodye)
    buildStructured outer (A.OnlyO _ opt)
      = do (s,e) <-
             case opt of
               (A.Option m es p) -> do
                 nexp <- addNode' m labelExpressionList (A.ExpressionList m es)
                 (nbodys, nbodye) <- buildProcess p
                 addEdge ESeq nexp nbodys
                 return (nexp,nbodye)
               (A.Else _ p) -> buildProcess p
           case outer of
             Case (cStart, cEnd) ->
               do addEdge ESeq cStart s
                  addEdge ESeq e cEnd
             _ -> throwError "Option found outside CASE statement"
           return (s,e)
    buildStructured outer (A.Spec m spec str)
      = do n <- addNode' m labelScopeIn spec
           n' <- addNode' m labelScopeOut spec
           (s,e) <- buildStructured outer str
           addEdge ESeq n s
           addEdge ESeq e n'
           return (n,n')
    buildStructured _ s = do n <- addDummyNode (findMeta s)
                             return (n,n)

-- Type commented out because it's not technically correct, but looks right to me:
--    buildProcess :: A.Process -> GraphMaker m a (Node, Node)
    buildProcess (A.Seq _ s) = buildStructured Seq s
    buildProcess (A.Par _ _ s) = buildStructured Par s
    buildProcess (A.While m e p)
      = do n <- addNode' m labelExpression e
           (start, end) <- buildProcess p
           addEdge ESeq n start
           addEdge ESeq end n
           return (n, n)
    buildProcess (A.Case m e s)
      = do nStart <- addNode' (findMeta e) labelExpression e
           nEnd <- addDummyNode m
           buildStructured (Case (nStart,nEnd)) s
           return (nStart, nEnd)
    buildProcess (A.If m s)
      = do nStart <- addDummyNode m
           nEnd <- addDummyNode m
           buildStructured (If nStart nEnd) s
           return (nStart, nEnd)
    buildProcess p = do (liftM mkPair) $ addNode' (findMeta p) labelProcess p

decomp22 :: (Monad m, Data a, Typeable a0, Typeable a1) => (a0 -> a1 -> a) -> (a1 -> m a1) -> (a -> m a)
decomp22 con f1 = decomp2 con return f1

decomp23 :: (Monad m, Data a, Typeable a0, Typeable a1, Typeable a2) => (a0 -> a1 -> a2 -> a) -> (a1 -> m a1) -> (a -> m a)
decomp23 con f1 = decomp3 con return f1 return

decomp33 :: (Monad m, Data a, Typeable a0, Typeable a1, Typeable a2) => (a0 -> a1 -> a2 -> a) -> (a2 -> m a2) -> (a -> m a)
decomp33 con f2 = decomp3 con return return f2