mirror of
https://github.com/GrammaticalFramework/gf-core.git
synced 2026-04-19 09:49:33 -06:00
PGF exports the public, stable API. PGF.Internal exports additional things needed in the GF compiler & shell, including the nonstardard version of Data.Binary.
209 lines
6.0 KiB
Haskell
209 lines
6.0 KiB
Haskell
----------------------------------------------------------------------
|
|
-- |
|
|
-- Module : Ident
|
|
-- Maintainer : AR
|
|
-- Stability : (stable)
|
|
-- Portability : (portable)
|
|
--
|
|
-- > CVS $Date: 2005/11/15 11:43:33 $
|
|
-- > CVS $Author: aarne $
|
|
-- > CVS $Revision: 1.8 $
|
|
--
|
|
-- (Description of the module)
|
|
-----------------------------------------------------------------------------
|
|
|
|
module GF.Infra.Ident (-- * Identifiers
|
|
Ident, ident2utf8, showIdent, ppIdent, prefixIdent,
|
|
identS, identC, identV, identA, identAV, identW,
|
|
argIdent, isArgIdent, getArgIndex,
|
|
varStr, varX, isWildIdent, varIndex,
|
|
-- * Raw Identifiers
|
|
RawIdent, rawIdentS, rawIdentC, ident2raw, prefixRawIdent,
|
|
isPrefixOf, showRawIdent{-,
|
|
-- * Refreshing identifiers
|
|
IdState, initIdStateN, initIdState,
|
|
lookVar, refVar, refVarPlus-}
|
|
) where
|
|
|
|
import qualified Data.ByteString.UTF8 as UTF8
|
|
import qualified Data.ByteString.Char8 as BS(append,isPrefixOf)
|
|
-- Limit use of BS functions to the ones that work correctly on
|
|
-- UTF-8-encoded bytestrings!
|
|
import Data.Char(isDigit)
|
|
import PGF.Internal(Binary(..))
|
|
import Text.PrettyPrint(Doc,text)
|
|
|
|
|
|
-- | the constructors labelled /INTERNAL/ are
|
|
-- internal representation never returned by the parser
|
|
data Ident =
|
|
IC {-# UNPACK #-} !RawIdent -- ^ raw identifier after parsing, resolved in Rename
|
|
| IW -- ^ wildcard
|
|
--
|
|
-- below this constructor: internal representation never returned by the parser
|
|
| IV {-# UNPACK #-} !RawIdent {-# UNPACK #-} !Int -- ^ /INTERNAL/ variable
|
|
| IA {-# UNPACK #-} !RawIdent {-# UNPACK #-} !Int -- ^ /INTERNAL/ argument of cat at position
|
|
| IAV {-# UNPACK #-} !RawIdent {-# UNPACK #-} !Int {-# UNPACK #-} !Int -- ^ /INTERNAL/ argument of cat with bindings at position
|
|
--
|
|
deriving (Eq, Ord, Show, Read)
|
|
|
|
-- | Identifiers are stored as UTF-8-encoded bytestrings.
|
|
newtype RawIdent = Id { rawId2utf8 :: UTF8.ByteString }
|
|
deriving (Eq, Ord, Show, Read)
|
|
|
|
pack = UTF8.fromString
|
|
unpack = UTF8.toString
|
|
|
|
rawIdentS = Id . pack
|
|
rawIdentC = Id
|
|
showRawIdent = unpack . rawId2utf8
|
|
|
|
prefixRawIdent (Id x) (Id y) = Id (BS.append x y)
|
|
isPrefixOf (Id x) (Id y) = BS.isPrefixOf x y
|
|
|
|
instance Binary RawIdent where
|
|
put = put . rawId2utf8
|
|
get = fmap rawIdentC get
|
|
|
|
|
|
-- | This function should be used with care, since the returned ByteString is
|
|
-- UTF-8-encoded.
|
|
ident2utf8 :: Ident -> UTF8.ByteString
|
|
ident2utf8 i = case i of
|
|
IC (Id s) -> s
|
|
IV (Id s) n -> BS.append s (pack ('_':show n))
|
|
IA (Id s) j -> BS.append s (pack ('_':show j))
|
|
IAV (Id s) b j -> BS.append s (pack ('_':show b ++ '_':show j))
|
|
IW -> pack "_"
|
|
|
|
ident2raw = Id . ident2utf8
|
|
|
|
showIdent :: Ident -> String
|
|
showIdent i = unpack $! ident2utf8 i
|
|
|
|
ppIdent :: Ident -> Doc
|
|
ppIdent = text . showIdent
|
|
|
|
identS :: String -> Ident
|
|
identS = identC . rawIdentS
|
|
|
|
identC :: RawIdent -> Ident
|
|
identV :: RawIdent -> Int -> Ident
|
|
identA :: RawIdent -> Int -> Ident
|
|
identAV:: RawIdent -> Int -> Int -> Ident
|
|
identW :: Ident
|
|
(identC, identV, identA, identAV, identW) =
|
|
(IC, IV, IA, IAV, IW)
|
|
|
|
|
|
prefixIdent :: String -> Ident -> Ident
|
|
prefixIdent pref = identC . Id . BS.append (pack pref) . ident2utf8
|
|
|
|
-- normal identifier
|
|
-- ident s = IC s
|
|
|
|
-- | to mark argument variables
|
|
argIdent :: Int -> Ident -> Int -> Ident
|
|
argIdent 0 (IC c) i = identA c i
|
|
argIdent b (IC c) i = identAV c b i
|
|
|
|
isArgIdent IA{} = True
|
|
isArgIdent IAV{} = True
|
|
isArgIdent _ = False
|
|
|
|
getArgIndex (IA _ i) = Just i
|
|
getArgIndex (IAV _ _ i) = Just i
|
|
getArgIndex (IC (Id bs))
|
|
| isDigit c =
|
|
-- (Just . read . unpack . snd . BS.spanEnd isDigit) bs -- not ok with UTF-8
|
|
(Just . read . reverse . takeWhile isDigit) s
|
|
where s@(c:_) = reverse (unpack bs)
|
|
getArgIndex x = Nothing
|
|
|
|
-- | used in lin defaults
|
|
varStr :: Ident
|
|
varStr = identA (rawIdentS "str") 0
|
|
|
|
-- | refreshing variables
|
|
varX :: Int -> Ident
|
|
varX = identV (rawIdentS "x")
|
|
|
|
isWildIdent :: Ident -> Bool
|
|
isWildIdent x = case x of
|
|
IW -> True
|
|
IC s | s == wild -> True
|
|
_ -> False
|
|
|
|
wild = Id (pack "_")
|
|
|
|
varIndex :: Ident -> Int
|
|
varIndex (IV _ n) = n
|
|
varIndex _ = -1 --- other than IV should not count
|
|
|
|
{-
|
|
-- * Refreshing identifiers
|
|
|
|
type IdState = ([(Ident,Ident)],Int)
|
|
|
|
initIdStateN :: Int -> IdState
|
|
initIdStateN i = ([],i)
|
|
|
|
initIdState :: IdState
|
|
initIdState = initIdStateN 0
|
|
|
|
lookVar :: Ident -> STM IdState Ident
|
|
lookVar a@(IA _ _) = return a
|
|
lookVar x = do
|
|
(sys,_) <- readSTM
|
|
stm (\s -> maybe (Bad ("cannot find" +++ show x +++ prParenth (show sys)))
|
|
return $
|
|
lookup x sys >>= (\y -> return (y,s)))
|
|
|
|
refVar :: Ident -> STM IdState Ident
|
|
----refVar IW = return IW --- no update of wildcard
|
|
refVar x = do
|
|
(_,m) <- readSTM
|
|
let x' = IV (ident2raw x) m
|
|
updateSTM (\(sys,mx) -> ((x, x'):sys, mx + 1))
|
|
return x'
|
|
|
|
refVarPlus :: Ident -> STM IdState Ident
|
|
----refVarPlus IW = refVar (identC "h")
|
|
refVarPlus x = refVar x
|
|
-}
|
|
|
|
{-
|
|
------------------------------
|
|
-- to test
|
|
|
|
refreshExp :: Exp -> Err Exp
|
|
refreshExp e = err Bad (return . fst) (appSTM (refresh e) initState)
|
|
|
|
refresh :: Exp -> STM State Exp
|
|
refresh e = case e of
|
|
Atom x -> lookVar x >>= return . Atom
|
|
App f a -> liftM2 App (refresh f) (refresh a)
|
|
Abs x b -> liftM2 Abs (refVar x) (refresh b)
|
|
Fun xs a b -> do
|
|
a' <- refresh a
|
|
xs' <- mapM refVar xs
|
|
b' <- refresh b
|
|
return $ Fun xs' a' b'
|
|
|
|
data Exp =
|
|
Atom Ident
|
|
| App Exp Exp
|
|
| Abs Ident Exp
|
|
| Fun [Ident] Exp Exp
|
|
deriving Show
|
|
|
|
exp1 = Abs (IC "y") (Atom (IC "y"))
|
|
exp2 = Abs (IC "y") (App (Atom (IC "y")) (Atom (IC "y")))
|
|
exp3 = Abs (IC "y") (Abs (IC "z") (App (Atom (IC "y")) (Atom (IC "z"))))
|
|
exp4 = Abs (IC "y") (Abs (IC "y") (App (Atom (IC "y")) (Atom (IC "z"))))
|
|
exp5 = Abs (IC "y") (Abs (IC "y") (App (Atom (IC "y")) (Atom (IC "y"))))
|
|
exp6 = Abs (IC "y") (Fun [IC "x", IC "y"] (Atom (IC "y")) (Atom (IC "y")))
|
|
exp7 = Abs (IL "8") (Atom (IC "y"))
|
|
|
|
-}
|