mirror of
https://github.com/GrammaticalFramework/gf-core.git
synced 2026-05-20 08:32:50 -06:00
preliminary version of morpho analysis
This commit is contained in:
@@ -14,6 +14,7 @@ import PGF.CId
|
|||||||
import PGF.ShowLinearize
|
import PGF.ShowLinearize
|
||||||
import PGF.Macros
|
import PGF.Macros
|
||||||
import PGF.Data ----
|
import PGF.Data ----
|
||||||
|
import PGF.Morphology
|
||||||
import GF.Compile.Export
|
import GF.Compile.Export
|
||||||
import GF.Infra.UseIO
|
import GF.Infra.UseIO
|
||||||
import GF.Data.ErrM ----
|
import GF.Data.ErrM ----
|
||||||
@@ -60,9 +61,9 @@ commandHelp full (co,info) = unlines $ [
|
|||||||
"flags: " ++ unwords (flags info)
|
"flags: " ++ unwords (flags info)
|
||||||
] else []
|
] else []
|
||||||
|
|
||||||
-- this list must be kept sorted by the command name!
|
-- this list must no more be kept sorted by the command name
|
||||||
allCommands :: PGF -> Map.Map String CommandInfo
|
allCommands :: PGF -> Map.Map String CommandInfo
|
||||||
allCommands pgf = Map.fromAscList [
|
allCommands pgf = Map.fromList [
|
||||||
("cc", emptyCommandInfo {
|
("cc", emptyCommandInfo {
|
||||||
longname = "compute_concrete",
|
longname = "compute_concrete",
|
||||||
synopsis = "computes concrete syntax term using the source grammar",
|
synopsis = "computes concrete syntax term using the source grammar",
|
||||||
@@ -144,15 +145,39 @@ allCommands pgf = Map.fromAscList [
|
|||||||
options = ["all","record","table","term"],
|
options = ["all","record","table","term"],
|
||||||
flags = ["lang"]
|
flags = ["lang"]
|
||||||
}),
|
}),
|
||||||
|
|
||||||
|
("ma", emptyCommandInfo {
|
||||||
|
longname = "morpho_analyse",
|
||||||
|
synopsis = "print the morphological analyses of all words in the string",
|
||||||
|
explanation = unlines [
|
||||||
|
"Prints all the analyses of space-separated words in the input string,",
|
||||||
|
"using the morphological analyser of the actual grammar (see command pf)"
|
||||||
|
],
|
||||||
|
exec = \opts ->
|
||||||
|
return . fromString . unlines .
|
||||||
|
map prMorphoAnalysis . concatMap (morphos opts) .
|
||||||
|
concatMap words . toStrings
|
||||||
|
}),
|
||||||
|
|
||||||
("p", emptyCommandInfo {
|
("p", emptyCommandInfo {
|
||||||
longname = "parse",
|
longname = "parse",
|
||||||
synopsis = "parse a string to abstract syntax expression",
|
synopsis = "parse a string to abstract syntax expression",
|
||||||
explanation = "Shows all trees (expressions) returned for String by the actual\n"++
|
explanation = "Shows all trees (expressions) returned for String by the actual\n"++
|
||||||
"grammar (overridden by the -lang flag), in the category S (overridden\n"++
|
"grammar (overridden by the -lang flag), in the category S (overridden\n"++
|
||||||
"by the -cat flag).",
|
"by the -cat flag).",
|
||||||
exec = \opts -> return . fromTrees . concatMap (par opts). toStrings,
|
exec = \opts -> return . fromTrees . concatMap (par opts) . toStrings,
|
||||||
flags = ["cat","lang"]
|
flags = ["cat","lang"]
|
||||||
}),
|
}),
|
||||||
|
("pf", emptyCommandInfo {
|
||||||
|
longname = "print_fullform",
|
||||||
|
synopsis = "print the full-form lexicon of the actual grammar",
|
||||||
|
explanation = unlines [
|
||||||
|
"Prints all the strings in the actual grammar with their possible analyses"
|
||||||
|
],
|
||||||
|
exec = \opts _ ->
|
||||||
|
return $ fromString $ concatMap
|
||||||
|
(prFullFormLexicon . buildMorpho pgf . mkCId) $ optLangs opts
|
||||||
|
}),
|
||||||
("pg", emptyCommandInfo {
|
("pg", emptyCommandInfo {
|
||||||
longname = "print_grammar",
|
longname = "print_grammar",
|
||||||
synopsis = "print the actual grammar with the given printer",
|
synopsis = "print the actual grammar with the given printer",
|
||||||
@@ -206,3 +231,6 @@ allCommands pgf = Map.fromAscList [
|
|||||||
prGrammar opts = case valIdOpts "printer" "" opts of
|
prGrammar opts = case valIdOpts "printer" "" opts of
|
||||||
"cats" -> unwords $ categories pgf
|
"cats" -> unwords $ categories pgf
|
||||||
v -> prPGF (read v) pgf (prCId (absname pgf))
|
v -> prPGF (read v) pgf (prCId (absname pgf))
|
||||||
|
|
||||||
|
morphos opts s =
|
||||||
|
[lookupMorpho (buildMorpho pgf (mkCId la)) s | la <- optLangs opts]
|
||||||
|
|||||||
46
src-3.0/PGF/Morphology.hs
Normal file
46
src-3.0/PGF/Morphology.hs
Normal file
@@ -0,0 +1,46 @@
|
|||||||
|
module PGF.Morphology where
|
||||||
|
|
||||||
|
import PGF.ShowLinearize
|
||||||
|
import PGF.Data
|
||||||
|
import PGF.CId
|
||||||
|
|
||||||
|
import qualified Data.Map as Map
|
||||||
|
import Data.List (intersperse)
|
||||||
|
|
||||||
|
-- these 4 definitions depend on the datastructure used
|
||||||
|
|
||||||
|
type Morpho = Map.Map String [(Lemma,Analysis)]
|
||||||
|
|
||||||
|
lookupMorpho :: Morpho -> String -> [(Lemma,Analysis)]
|
||||||
|
lookupMorpho mo s = maybe noAnalysis id $ Map.lookup s mo
|
||||||
|
|
||||||
|
buildMorpho :: PGF -> CId -> Morpho
|
||||||
|
buildMorpho pgf = Map.fromListWith (++) . collectWords pgf
|
||||||
|
|
||||||
|
prFullFormLexicon :: Morpho -> String
|
||||||
|
prFullFormLexicon mo =
|
||||||
|
unlines [w ++ " : " ++ prMorphoAnalysis ts | (w,ts) <- Map.assocs mo]
|
||||||
|
|
||||||
|
prMorphoAnalysis :: [(Lemma,Analysis)] -> String
|
||||||
|
prMorphoAnalysis lps = unlines [l ++ " " ++ p | (l,p) <- lps]
|
||||||
|
|
||||||
|
type Lemma = String
|
||||||
|
type Analysis = String
|
||||||
|
|
||||||
|
noAnalysis :: [(Lemma,Analysis)]
|
||||||
|
noAnalysis = []
|
||||||
|
|
||||||
|
collectWords :: PGF -> CId -> [(String, [(Lemma,Analysis)])]
|
||||||
|
collectWords pgf lang =
|
||||||
|
concatMap collOne
|
||||||
|
[(f,c,0) | (f,(DTyp [] c _,_)) <- Map.toList $ funs $ abstract pgf]
|
||||||
|
where
|
||||||
|
collOne (f,c,i) =
|
||||||
|
fromRec f [prCId c] (recLinearize pgf lang (EApp f (replicate i (EMeta 888))))
|
||||||
|
fromRec f v r = case r of
|
||||||
|
RR rs -> concat [fromRec f v t | (_,t) <- rs]
|
||||||
|
RT rs -> concat [fromRec f (p:v) t | (p,t) <- rs]
|
||||||
|
RFV rs -> concatMap (fromRec f v) rs
|
||||||
|
RS s -> [(s,[(prCId f,unwords (reverse v))])]
|
||||||
|
RCon c -> [] ---- inherent
|
||||||
|
|
||||||
@@ -1,4 +1,5 @@
|
|||||||
module PGF.ShowLinearize (
|
module PGF.ShowLinearize (
|
||||||
|
Record (..), recLinearize, --- used in PGF.Morphology
|
||||||
tableLinearize,
|
tableLinearize,
|
||||||
recordLinearize,
|
recordLinearize,
|
||||||
termLinearize,
|
termLinearize,
|
||||||
|
|||||||
Reference in New Issue
Block a user