mirror of
https://github.com/GrammaticalFramework/gf-core.git
synced 2026-04-25 20:42:50 -06:00
Founding the newly structured GF2.0 cvs archive.
This commit is contained in:
56
src/GF/Text/Text.hs
Normal file
56
src/GF/Text/Text.hs
Normal file
@@ -0,0 +1,56 @@
|
||||
module Text where
|
||||
|
||||
import Operations
|
||||
import Char
|
||||
|
||||
-- elementary text postprocessing. AR 21/11/2001
|
||||
-- This is very primitive indeed. The functions should work on
|
||||
-- token lists and not on strings. AR 5/12/2002
|
||||
|
||||
|
||||
formatAsTextLit :: String -> String
|
||||
formatAsTextLit = formatAsText . unwords . map unStringLit . words
|
||||
--- hope that there will be deforestation...
|
||||
|
||||
formatAsCodeLit :: String -> String
|
||||
formatAsCodeLit = formatAsCode . unwords . map unStringLit . words
|
||||
|
||||
formatAsText :: String -> String
|
||||
formatAsText = unwords . format . cap . words where
|
||||
format ws = case ws of
|
||||
w : c : ww | major c -> (w ++ c) : format (cap ww)
|
||||
w : c : ww | minor c -> (w ++ c) : format ww
|
||||
c : ww | para c -> "\n\n" : format ww
|
||||
w : ww -> w : format ww
|
||||
[] -> []
|
||||
cap (p:(c:cs):ww) | para p = p : (toUpper c : cs) : ww
|
||||
cap ((c:cs):ww) = (toUpper c : cs) : ww
|
||||
cap [] = []
|
||||
major = flip elem (map singleton ".!?")
|
||||
minor = flip elem (map singleton ",:;")
|
||||
para = (=="<p>")
|
||||
|
||||
formatAsCode :: String -> String
|
||||
formatAsCode = unwords . format . words where
|
||||
format ws = case ws of
|
||||
p : w : ww | parB p -> format ((p ++ w') : ww') where (w':ww') = format (w:ww)
|
||||
w : p : ww | par p -> format ((w ++ p') : ww') where (p':ww') = format (p:ww)
|
||||
w : ww -> w : format ww
|
||||
[] -> []
|
||||
parB = flip elem (map singleton "([{")
|
||||
parE = flip elem (map singleton "}])")
|
||||
par t = parB t || parE t
|
||||
|
||||
performBinds :: String -> String
|
||||
performBinds = unwords . format . words where
|
||||
format ws = case ws of
|
||||
w : "&+" : u : ws -> format ((w ++ u) : ws)
|
||||
w : ws -> w : format ws
|
||||
[] -> []
|
||||
|
||||
unStringLit :: String -> String
|
||||
unStringLit s = case s of
|
||||
c : cs | strlim c && strlim (last cs) -> init cs
|
||||
_ -> s
|
||||
where
|
||||
strlim = (=='\'')
|
||||
Reference in New Issue
Block a user