mirror of
https://github.com/GrammaticalFramework/gf-core.git
synced 2026-05-05 01:02:51 -06:00
52 lines
1.4 KiB
Haskell
52 lines
1.4 KiB
Haskell
----------------------------------------------------------------------
|
|
-- |
|
|
-- Module : Unlex
|
|
-- Maintainer : (Maintainer)
|
|
-- Stability : (stable)
|
|
-- Portability : (portable)
|
|
--
|
|
-- > CVS $Date $
|
|
-- > CVS $Author $
|
|
-- > CVS $Revision $
|
|
--
|
|
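-- Elementary text postprocessing: gluing bound tokens together and
-- formatting punctuation, capitalisation and paragraph breaks.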
|
|
-----------------------------------------------------------------------------
|
|
|
|
module Unlex where
|
|
|
|
import Operations
|
|
import Str
|
|
|
|
import Char
|
|
import List (isPrefixOf)
|
|
|
|
-- elementary text postprocessing. AR 21/11/2001
|
|
|
|
-- | Tidy up a whitespace-separated token string so it reads as running text.
--
-- The input is split with 'words' and re-joined with 'unwords', so every run
-- of whitespace collapses to a single space. Between those two steps the
-- token list is rewritten, trying these rules in order at each position:
--
-- 1. a token followed by a stand-alone @.@, @!@ or @?@ absorbs that
--    punctuation, and the start of what follows is capitalised;
-- 2. a token followed by a stand-alone @,@, @:@ or @;@ absorbs that
--    punctuation;
-- 3. the paragraph marker @&-@ is replaced by the token @"\\n\\n"@;
-- 4. any other token is passed through unchanged.
--
-- The very first word of the input is capitalised as well.
formatAsText :: String -> String
formatAsText = unwords . punctuate . capitalise . words
  where
    -- Attach punctuation tokens to the preceding token and expand
    -- paragraph markers. When neither guard of the first equation holds,
    -- matching falls through to the equations below.
    punctuate (w : p : rest)
      | isMajor p = (w ++ p) : punctuate (capitalise rest)
      | isMinor p = (w ++ p) : punctuate rest
    punctuate (w : rest)
      | isPara w  = "\n\n" : punctuate rest
      | otherwise = w : punctuate rest
    punctuate [] = []

    -- Upper-case the first letter of the first real word, looking past a
    -- leading paragraph marker if there is one.
    capitalise (p : w : rest)
      | isPara p = p : upperFirst w : rest
    capitalise (w : rest) = upperFirst w : rest
    capitalise [] = []

    -- Tokens come from 'words' and are therefore never empty; the second
    -- equation only keeps this helper total.
    upperFirst (c : cs) = toUpper c : cs
    upperFirst []       = []

    isMajor = (`elem` [".", "!", "?"])  -- sentence-final punctuation
    isMinor = (`elem` [",", ":", ";"])  -- sentence-internal punctuation
    isPara  = (== "&-")                 -- paragraph-break marker
|
|
|
|
-- | Turn a list of 'Str' values into formatted text.
--
-- Only the first element of the list is used (@take 1@); an empty list
-- yields the empty string. That element is converted with 'sstr' from the
-- @Str@ module (presumably its plain-string rendering -- confirm there),
-- passed through 'performBinds', and finally through 'formatAsText'.
--
-- NOTE(review): the original line carried a trailing @----@ marker after
-- @take 1@, which looks like a flag that dropping the remaining elements is
-- provisional -- confirm before relying on it.
unlex :: [Str] -> String
unlex strs = formatAsText (performBinds (concatMap sstr (take 1 strs)))
|
|
|
|
-- modified from GF/src/Text by adding hyphen
|
|
-- | Glue together tokens that are joined by a binding marker.
--
-- The input is split with 'words' and re-joined with 'unwords'. Scanning
-- left to right:
--
-- * @w - u@ (a stand-alone hyphen between two tokens) becomes @w-u@;
-- * @w &+ u@ becomes @wu@.
--
-- The merged token is examined again, so chains such as @a &+ b &+ c@
-- collapse into one token. A marker with no token on one side of it is
-- left in place.
performBinds :: String -> String
performBinds = unwords . bind . words
  where
    bind (w : "-"  : u : rest) = bind ((w ++ "-" ++ u) : rest)
    bind (w : "&+" : u : rest) = bind ((w ++ u) : rest)
    bind (w : rest)            = w : bind rest
    bind []                    = []
|
|
|