gf-core/src/runtime/haskell/PGF/CId.hs

module PGF.CId (CId(..),
                mkCId, wildCId,
                readCId, showCId,

                -- utils
                utf8CId, pCId, pIdent, ppCId) where

import Control.Monad
import qualified Data.ByteString.Char8 as BS
import qualified Data.ByteString.UTF8 as UTF8
import Data.Char
import qualified Text.ParserCombinators.ReadP as RP
import qualified Text.PrettyPrint as PP


-- | An abstract data type that represents
-- identifiers for functions and categories in PGF.
newtype CId = CId BS.ByteString deriving (Eq,Ord)

wildCId :: CId
wildCId = CId (BS.singleton '_')

-- | Creates a new identifier from 'String'
mkCId :: String -> CId
mkCId s = CId (UTF8.fromString s)

-- | Creates an identifier from a UTF-8-encoded 'ByteString'
utf8CId = CId

-- | Reads an identifier from 'String'. The function returns 'Nothing' if the string is not valid identifier.
readCId :: String -> Maybe CId
readCId s = case [x | (x,cs) <- RP.readP_to_S pCId s, all isSpace cs] of
              [x] -> Just x
              _   -> Nothing

-- | Renders the identifier as 'String'
showCId :: CId -> String
showCId (CId x) =
  let raw = UTF8.toString x
  in if isIdent raw
       then raw
       else "'" ++ concatMap escape raw ++ "'"
  where
    isIdent []     = False
    isIdent (c:cs) = isIdentFirst c && all isIdentRest cs

    escape '\'' = "\\\'"
    escape '\\' = "\\\\"
    escape c    = [c]

instance Show CId where
    showsPrec _ = showString . showCId

instance Read CId where
    readsPrec _ = RP.readP_to_S pCId

pCId :: RP.ReadP CId
pCId = do s <- pIdent
          if s == "_"
            then RP.pfail
            else return (mkCId s)

pIdent :: RP.ReadP String
pIdent =
  liftM2 (:) (RP.satisfy isIdentFirst) (RP.munch isIdentRest)
  `mplus`
  do RP.char '\''
     cs <- RP.many1 insideChar
     RP.char '\''
     return cs
--  where
insideChar = RP.readS_to_P $ \s ->
  case s of
	[]             -> []
	('\\':'\\':cs) -> [('\\',cs)]
	('\\':'\'':cs) -> [('\'',cs)]
	('\\':cs)      -> []
	('\'':cs)      -> []
	(c:cs)         -> [(c,cs)]

isIdentFirst c =
  (c == '_') ||
  (c >= 'a' && c <= 'z') ||
  (c >= 'A' && c <= 'Z') ||
  (c >= '\192' && c <= '\255' && c /= '\247' && c /= '\215')
isIdentRest c =
  (c == '_') ||
  (c == '\'') ||
  (c >= '0' && c <= '9') ||
  (c >= 'a' && c <= 'z') ||
  (c >= 'A' && c <= 'Z') ||
  (c >= '\192' && c <= '\255' && c /= '\247' && c /= '\215')

ppCId :: CId -> PP.Doc
ppCId = PP.text . showCId