forked from GitHub/gf-core
started adding GF back optimization (Factorize)
This commit is contained in:
@@ -189,7 +189,7 @@ checkCompleteGrammar abs cnc = do
|
|||||||
where
|
where
|
||||||
checkOne js i@(c, Left ju) = case jform ju of
|
checkOne js i@(c, Left ju) = case jform ju of
|
||||||
JFun -> case Map.lookup c js of
|
JFun -> case Map.lookup c js of
|
||||||
Just (Left j) | jform ju == JLin -> return js
|
Just (Left j) | jform j == JLin -> return js
|
||||||
_ -> do
|
_ -> do
|
||||||
checkWarn $ "WARNING: no linearization of" +++ prt c
|
checkWarn $ "WARNING: no linearization of" +++ prt c
|
||||||
return js
|
return js
|
||||||
|
|||||||
@@ -7,14 +7,14 @@ import GF.Devel.Compile.Rename
|
|||||||
import GF.Devel.Compile.CheckGrammar
|
import GF.Devel.Compile.CheckGrammar
|
||||||
import GF.Devel.Compile.Refresh
|
import GF.Devel.Compile.Refresh
|
||||||
import GF.Devel.Compile.Optimize
|
import GF.Devel.Compile.Optimize
|
||||||
----import GF.Devel.OptimizeGF
|
import GF.Devel.Compile.Factorize
|
||||||
|
|
||||||
import GF.Devel.Grammar.Terms
|
import GF.Devel.Grammar.Terms
|
||||||
import GF.Devel.Grammar.Modules
|
import GF.Devel.Grammar.Modules
|
||||||
import GF.Devel.Grammar.Judgements
|
import GF.Devel.Grammar.Judgements
|
||||||
import GF.Infra.Ident
|
import GF.Infra.Ident
|
||||||
import GF.Devel.Grammar.PrGF
|
import GF.Devel.Grammar.PrGF
|
||||||
----import GF.Grammar.Lookup
|
----import GF.Devel.Grammar.Lookup
|
||||||
import GF.Devel.ReadFiles
|
import GF.Devel.ReadFiles
|
||||||
|
|
||||||
import GF.Infra.Option ----
|
import GF.Infra.Option ----
|
||||||
@@ -161,8 +161,10 @@ compileSourceModule opts env@(k,gr) mo@(i,mi) = do
|
|||||||
moo <- putpp " optimizing " $ ioeErr $ optimizeModule opts gr mox
|
moo <- putpp " optimizing " $ ioeErr $ optimizeModule opts gr mox
|
||||||
intermOut opts (iOpt "show_optimize") (prMod moo)
|
intermOut opts (iOpt "show_optimize") (prMod moo)
|
||||||
|
|
||||||
|
mof <- putpp " factorizing " $ ioeErr $ optimizeModule opts gr moo
|
||||||
|
intermOut opts (iOpt "show_factorize") (prMod mof)
|
||||||
|
|
||||||
return (k,moo) ----
|
return (k,mof) ----
|
||||||
|
|
||||||
|
|
||||||
{- ----
|
{- ----
|
||||||
|
|||||||
261
src/GF/Devel/Compile/Factorize.hs
Normal file
261
src/GF/Devel/Compile/Factorize.hs
Normal file
@@ -0,0 +1,261 @@
|
|||||||
|
----------------------------------------------------------------------
|
||||||
|
-- |
|
||||||
|
-- Module : OptimizeGF
|
||||||
|
-- Maintainer : AR
|
||||||
|
-- Stability : (stable)
|
||||||
|
-- Portability : (portable)
|
||||||
|
--
|
||||||
|
-- > CVS $Date: 2005/04/21 16:21:33 $
|
||||||
|
-- > CVS $Author: bringert $
|
||||||
|
-- > CVS $Revision: 1.6 $
|
||||||
|
--
|
||||||
|
-- Optimizations on GF source code: sharing, parametrization, value sets.
|
||||||
|
--
|
||||||
|
-- optimization: sharing branches in tables. AR 25\/4\/2003.
|
||||||
|
-- following advice of Josef Svenningsson
|
||||||
|
-----------------------------------------------------------------------------
|
||||||
|
|
||||||
|
module GF.Devel.Compile.Factorize (
|
||||||
|
optModule,
|
||||||
|
unshareModule,
|
||||||
|
unsubexpModule,
|
||||||
|
unoptModule,
|
||||||
|
subexpModule,
|
||||||
|
shareModule
|
||||||
|
) where
|
||||||
|
|
||||||
|
import GF.Devel.Grammar.Modules
|
||||||
|
import GF.Devel.Grammar.Judgements
|
||||||
|
import GF.Devel.Grammar.Terms
|
||||||
|
import GF.Devel.Grammar.MkJudgements
|
||||||
|
import GF.Devel.Grammar.PrGF (prt)
|
||||||
|
import qualified GF.Devel.Grammar.Macros as C
|
||||||
|
|
||||||
|
import GF.Devel.Grammar.Lookup
|
||||||
|
import GF.Infra.Ident
|
||||||
|
|
||||||
|
import GF.Data.Operations
|
||||||
|
|
||||||
|
import Control.Monad
|
||||||
|
import Data.Map (Map)
|
||||||
|
import qualified Data.Map as Map
|
||||||
|
import Data.List
|
||||||
|
|
||||||
|
optModule :: SourceModule -> SourceModule
|
||||||
|
optModule = subexpModule . shareModule
|
||||||
|
|
||||||
|
shareModule = processModule optim
|
||||||
|
|
||||||
|
unoptModule :: GF -> SourceModule -> SourceModule
|
||||||
|
unoptModule gr = unshareModule gr . unsubexpModule
|
||||||
|
|
||||||
|
unshareModule :: GF -> SourceModule -> SourceModule
|
||||||
|
unshareModule gr = processModule (const (unoptim gr))
|
||||||
|
|
||||||
|
processModule :: (Ident -> Term -> Term) -> SourceModule -> SourceModule
|
||||||
|
processModule opt (i,m) = (i, C.judgementOpModule (shareInfo (opt i)) m)
|
||||||
|
|
||||||
|
shareInfo :: (Term -> Term) -> Judgement -> Err Judgement
|
||||||
|
shareInfo opt ju = return $ ju {jdef = opt (jdef ju)}
|
||||||
|
|
||||||
|
-- the function putting together optimizations
|
||||||
|
optim :: Ident -> Term -> Term
|
||||||
|
optim c = values . factor c 0
|
||||||
|
|
||||||
|
-- we need no counter to create new variable names, since variables are
|
||||||
|
-- local to tables ----
|
||||||
|
-- factor parametric branches
|
||||||
|
|
||||||
|
factor :: Ident -> Int -> Term -> Term
|
||||||
|
factor c i t = case t of
|
||||||
|
T _ [_] -> t
|
||||||
|
T _ [] -> t
|
||||||
|
T (TComp ty) cs ->
|
||||||
|
T (TTyped ty) $ factors i [(p, factor c (i+1) v) | (p, v) <- cs]
|
||||||
|
_ -> C.composSafeOp (factor c i) t
|
||||||
|
where
|
||||||
|
|
||||||
|
factors i psvs = -- we know psvs has at least 2 elements
|
||||||
|
let p = qqIdent c i
|
||||||
|
vs' = map (mkFun p) psvs
|
||||||
|
in if allEqs vs'
|
||||||
|
then mkCase p vs'
|
||||||
|
else psvs
|
||||||
|
|
||||||
|
mkFun p (patt, val) = replace (C.patt2term patt) (Vr p) val
|
||||||
|
|
||||||
|
allEqs (v:vs) = all (==v) vs
|
||||||
|
|
||||||
|
mkCase p (v:_) = [(PV p, v)]
|
||||||
|
|
||||||
|
--- we hope this will be fresh and don't check...
|
||||||
|
|
||||||
|
qqIdent c i = identC ("_q" ++ prt c ++ "__" ++ show i)
|
||||||
|
|
||||||
|
|
||||||
|
-- we need to replace subterms
|
||||||
|
|
||||||
|
replace :: Term -> Term -> Term -> Term
|
||||||
|
replace old new trm = case trm of
|
||||||
|
|
||||||
|
-- these are the important cases, since they can correspond to patterns
|
||||||
|
QC _ _ | trm == old -> new
|
||||||
|
App t ts | trm == old -> new
|
||||||
|
App t ts -> App (repl t) (repl ts)
|
||||||
|
R _ | isRec && trm == old -> new
|
||||||
|
_ -> C.composSafeOp repl trm
|
||||||
|
where
|
||||||
|
repl = replace old new
|
||||||
|
isRec = case trm of
|
||||||
|
R _ -> True
|
||||||
|
_ -> False
|
||||||
|
|
||||||
|
-- It is very important that this is performed only after case
|
||||||
|
-- expansion since otherwise the order and number of values can
|
||||||
|
-- be incorrect. Guaranteed by the TComp flag.
|
||||||
|
|
||||||
|
values :: Term -> Term
|
||||||
|
values t = case t of
|
||||||
|
T ty [(ps,t)] -> T ty [(ps,values t)] -- don't destroy parametrization
|
||||||
|
T (TComp ty) cs -> V ty [values t | (_, t) <- cs]
|
||||||
|
T (TTyped ty) cs -> V ty [values t | (_, t) <- cs]
|
||||||
|
---- why are these left?
|
||||||
|
---- printing with GrammarToSource does not preserve the distinction
|
||||||
|
_ -> C.composSafeOp values t
|
||||||
|
|
||||||
|
|
||||||
|
-- to undo the effect of factorization
|
||||||
|
|
||||||
|
unoptim :: GF -> Term -> Term
|
||||||
|
unoptim gr = unfactor gr
|
||||||
|
|
||||||
|
unfactor :: GF -> Term -> Term
|
||||||
|
unfactor gr t = case t of
|
||||||
|
T (TTyped ty) [(PV x,u)] -> V ty [restore x v (unfac u) | v <- vals ty]
|
||||||
|
_ -> C.composSafeOp unfac t
|
||||||
|
where
|
||||||
|
unfac = unfactor gr
|
||||||
|
vals = err error id . allParamValues gr
|
||||||
|
restore x u t = case t of
|
||||||
|
Vr y | y == x -> u
|
||||||
|
_ -> C.composSafeOp (restore x u) t
|
||||||
|
|
||||||
|
|
||||||
|
----------------------------------------------------------------------
|
||||||
|
|
||||||
|
{-
|
||||||
|
This module implements a simple common subexpression elimination
|
||||||
|
for gfc grammars, to factor out shared subterms in lin rules.
|
||||||
|
It works in three phases:
|
||||||
|
|
||||||
|
(1) collectSubterms collects recursively all subterms of forms table and (P x..y)
|
||||||
|
from lin definitions (experience shows that only these forms
|
||||||
|
tend to get shared) and counts how many times they occur
|
||||||
|
(2) addSubexpConsts takes those subterms t that occur more than once
|
||||||
|
and creates definitions of form "oper A''n = t" where n is a
|
||||||
|
fresh number; notice that we assume no ids of this form are in
|
||||||
|
scope otherwise
|
||||||
|
(3) elimSubtermsMod goes through lins and the created opers by replacing largest
|
||||||
|
possible subterms by the newly created identifiers
|
||||||
|
|
||||||
|
The optimization is invoked in gf by the flag i -subs.
|
||||||
|
|
||||||
|
If an application does not support GFC opers, the effect of this
|
||||||
|
optimization can be undone by the function unSubelimCanon.
|
||||||
|
|
||||||
|
The function unSubelimCanon can be used to diagnostisize how much
|
||||||
|
cse is possible in the grammar. It is used by the flag pg -printer=subs.
|
||||||
|
|
||||||
|
-}
|
||||||
|
|
||||||
|
subexpModule :: SourceModule -> SourceModule
|
||||||
|
subexpModule (mo,m) = errVal (mo,m) $ case m of
|
||||||
|
M.ModMod (M.Module mt st fs me ops js) -> do
|
||||||
|
(tree,_) <- appSTM (getSubtermsMod mo (tree2list js)) (Map.empty,0)
|
||||||
|
js2 <- liftM buildTree $ addSubexpConsts mo tree $ tree2list js
|
||||||
|
return (mo,M.ModMod (M.Module mt st fs me ops js2))
|
||||||
|
_ -> return (mo,m)
|
||||||
|
|
||||||
|
unsubexpModule :: SourceModule -> SourceModule
|
||||||
|
unsubexpModule mo@(i,m) = case m of
|
||||||
|
M.ModMod (M.Module mt st fs me ops js) | hasSub ljs ->
|
||||||
|
(i, M.ModMod (M.Module mt st fs me ops
|
||||||
|
(rebuild (map unparInfo ljs))))
|
||||||
|
where ljs = tree2list js
|
||||||
|
_ -> (i,m)
|
||||||
|
where
|
||||||
|
-- perform this iff the module has opers
|
||||||
|
hasSub ljs = not $ null [c | (c,ResOper _ _) <- ljs]
|
||||||
|
unparInfo (c,info) = case info of
|
||||||
|
CncFun xs (Yes t) m -> [(c, CncFun xs (Yes (unparTerm t)) m)]
|
||||||
|
ResOper (Yes (EInt 8)) _ -> [] -- subexp-generated opers
|
||||||
|
ResOper pty (Yes t) -> [(c, ResOper pty (Yes (unparTerm t)))]
|
||||||
|
_ -> [(c,info)]
|
||||||
|
unparTerm t = case t of
|
||||||
|
Q m c@(IC ('A':'\'':'\'':_)) -> --- name convention of subexp opers
|
||||||
|
errVal t $ liftM unparTerm $ lookupResDef gr m c
|
||||||
|
_ -> C.composSafeOp unparTerm t
|
||||||
|
gr = M.MGrammar [mo]
|
||||||
|
rebuild = buildTree . concat
|
||||||
|
|
||||||
|
-- implementation
|
||||||
|
|
||||||
|
type TermList = Map Term (Int,Int) -- number of occs, id
|
||||||
|
type TermM a = STM (TermList,Int) a
|
||||||
|
|
||||||
|
addSubexpConsts ::
|
||||||
|
Ident -> Map Term (Int,Int) -> [(Ident,Info)] -> Err [(Ident,Info)]
|
||||||
|
addSubexpConsts mo tree lins = do
|
||||||
|
let opers = [oper id trm | (trm,(_,id)) <- list]
|
||||||
|
mapM mkOne $ opers ++ lins
|
||||||
|
where
|
||||||
|
|
||||||
|
mkOne (f,def) = (f,def {jdef = recomp f (jdef def)})
|
||||||
|
recomp f t = case Map.lookup t tree of
|
||||||
|
Just (_,id) | ident id /= f -> return $ Q mo (ident id)
|
||||||
|
_ -> C.composOp (recomp f) t
|
||||||
|
|
||||||
|
list = Map.toList tree
|
||||||
|
|
||||||
|
oper id trm = (ident id, resOper (EInt 8) (Yes trm))
|
||||||
|
--- impossible type encoding generated opers
|
||||||
|
|
||||||
|
getSubtermsMod :: Ident -> [(Ident,Judgement)] -> TermM (Map Term (Int,Int))
|
||||||
|
getSubtermsMod mo js = do
|
||||||
|
mapM (getInfo (collectSubterms mo)) js
|
||||||
|
(tree0,_) <- readSTM
|
||||||
|
return $ Map.filter (\ (nu,_) -> nu > 1) tree0
|
||||||
|
where
|
||||||
|
getInfo get fi@(f,i) = do
|
||||||
|
get (jdef i)
|
||||||
|
return $ fi
|
||||||
|
|
||||||
|
collectSubterms :: Ident -> Term -> TermM Term
|
||||||
|
collectSubterms mo t = case t of
|
||||||
|
App f a -> do
|
||||||
|
collect f
|
||||||
|
collect a
|
||||||
|
add t
|
||||||
|
T ty cs -> do
|
||||||
|
let (_,ts) = unzip cs
|
||||||
|
mapM collect ts
|
||||||
|
add t
|
||||||
|
V ty ts -> do
|
||||||
|
mapM collect ts
|
||||||
|
add t
|
||||||
|
---- K (KP _ _) -> add t
|
||||||
|
_ -> C.composOp (collectSubterms mo) t
|
||||||
|
where
|
||||||
|
collect = collectSubterms mo
|
||||||
|
add t = do
|
||||||
|
(ts,i) <- readSTM
|
||||||
|
let
|
||||||
|
((count,id),next) = case Map.lookup t ts of
|
||||||
|
Just (nu,id) -> ((nu+1,id), i)
|
||||||
|
_ -> ((1, i ), i+1)
|
||||||
|
writeSTM (Map.insert t (count,id) ts, next)
|
||||||
|
return t --- only because of composOp
|
||||||
|
|
||||||
|
ident :: Int -> Ident
|
||||||
|
ident i = identC ("_A" ++ show i) ---
|
||||||
|
|
||||||
Reference in New Issue
Block a user