mirror of
https://github.com/GrammaticalFramework/gf-core.git
synced 2026-04-23 11:42:49 -06:00
visualization of word alignment based on bracketing (command aw); does not work for syncategorematic words yet
This commit is contained in:
@@ -104,6 +104,41 @@ allCommands cod env@(pgf, mos) = Map.fromList [
|
|||||||
"gt | l | ? wc -- generate, linearize, word-count"
|
"gt | l | ? wc -- generate, linearize, word-count"
|
||||||
]
|
]
|
||||||
}),
|
}),
|
||||||
|
|
||||||
|
("aw", emptyCommandInfo {
|
||||||
|
longname = "align_words",
|
||||||
|
synopsis = "show word alignments between languages graphically",
|
||||||
|
explanation = unlines [
|
||||||
|
"Prints a set of strings in the .dot format (the graphviz format).",
|
||||||
|
"The graph can be saved in a file by the wf command as usual.",
|
||||||
|
"If the -view flag is defined, the graph is saved in a temporary file",
|
||||||
|
"which is processed by graphviz and displayed by the program indicated",
|
||||||
|
"by the flag. The target format is postscript, unless overridden by the",
|
||||||
|
"flag -format."
|
||||||
|
],
|
||||||
|
exec = \opts ts -> do
|
||||||
|
let grph = if null ts then [] else alignLinearize pgf (head ts)
|
||||||
|
if isFlag "view" opts || isFlag "format" opts then do
|
||||||
|
let file s = "_grph." ++ s
|
||||||
|
let view = optViewGraph opts ++ " "
|
||||||
|
let format = optViewFormat opts
|
||||||
|
writeFile (file "dot") (enc grph)
|
||||||
|
system $ "dot -T" ++ format ++ " " ++ file "dot" ++ " > " ++ file format ++
|
||||||
|
" ; " ++ view ++ file format
|
||||||
|
return void
|
||||||
|
else return $ fromString grph,
|
||||||
|
examples = [
|
||||||
|
"gr | aw -- generate a tree and show word alignment as graph script",
|
||||||
|
"gr | vt -view=\"open\" -- generate a tree and display alignment on a Mac"
|
||||||
|
],
|
||||||
|
options = [
|
||||||
|
],
|
||||||
|
flags = [
|
||||||
|
("format","format of the visualization file (default \"ps\")"),
|
||||||
|
("view","program to open the resulting file (default \"gv\")")
|
||||||
|
]
|
||||||
|
}),
|
||||||
|
|
||||||
("cc", emptyCommandInfo {
|
("cc", emptyCommandInfo {
|
||||||
longname = "compute_concrete",
|
longname = "compute_concrete",
|
||||||
syntax = "cc (-all | -table | -unqual)? TERM",
|
syntax = "cc (-all | -table | -unqual)? TERM",
|
||||||
|
|||||||
@@ -146,10 +146,11 @@ linTreeMark pgf lang = lin []
|
|||||||
R ts -> R $ map (mark p) ts
|
R ts -> R $ map (mark p) ts
|
||||||
FV ts -> R $ map (mark p) ts
|
FV ts -> R $ map (mark p) ts
|
||||||
S ts -> S $ bracket p ts
|
S ts -> S $ bracket p ts
|
||||||
K s -> S $ bracket p [t]
|
K s -> S $ bracketw p [t]
|
||||||
W s (R ts) -> R [mark p $ kks (s ++ u) | K (KS u) <- ts]
|
W s (R ts) -> R [mark p $ kks (s ++ u) | K (KS u) <- ts]
|
||||||
_ -> t
|
_ -> t
|
||||||
-- otherwise in normal form
|
-- otherwise in normal form
|
||||||
|
|
||||||
bracket p ts = [kks ("["++show p)] ++ ts ++ [kks "]"]
|
bracket p ts = [kks ("("++show p)] ++ ts ++ [kks ")"]
|
||||||
|
bracketw p ts = [kks ("{"++show p)] ++ ts ++ [kks "}"] -- for easy word alignment
|
||||||
sub p i = p ++ [i]
|
sub p i = p ++ [i]
|
||||||
|
|||||||
@@ -15,13 +15,16 @@
|
|||||||
-- instead of rolling its own.
|
-- instead of rolling its own.
|
||||||
-----------------------------------------------------------------------------
|
-----------------------------------------------------------------------------
|
||||||
|
|
||||||
module PGF.VisualizeTree ( visualizeTrees
|
module PGF.VisualizeTree ( visualizeTrees, alignLinearize
|
||||||
) where
|
) where
|
||||||
|
|
||||||
import PGF.CId (prCId)
|
import PGF.CId (prCId)
|
||||||
import PGF.Data
|
import PGF.Data
|
||||||
|
import PGF.Linearize
|
||||||
import PGF.Macros (lookValCat)
|
import PGF.Macros (lookValCat)
|
||||||
|
|
||||||
|
import Data.List (intersperse)
|
||||||
|
|
||||||
visualizeTrees :: PGF -> (Bool,Bool) -> [Tree] -> String
|
visualizeTrees :: PGF -> (Bool,Bool) -> [Tree] -> String
|
||||||
visualizeTrees pgf funscats = unlines . map (prGraph False . tree2graph pgf funscats)
|
visualizeTrees pgf funscats = unlines . map (prGraph False . tree2graph pgf funscats)
|
||||||
|
|
||||||
@@ -46,3 +49,73 @@ tree2graph pgf (funs,cats) = prf [] where
|
|||||||
|
|
||||||
prGraph digr ns = concat $ map (++"\n") $ [graph ++ "{\n"] ++ ns ++ ["}"] where
|
prGraph digr ns = concat $ map (++"\n") $ [graph ++ "{\n"] ++ ns ++ ["}"] where
|
||||||
graph = if digr then "digraph" else "graph"
|
graph = if digr then "digraph" else "graph"
|
||||||
|
|
||||||
|
|
||||||
|
-- word alignments from Linearize.linearizesMark
|
||||||
|
-- words are chunks like {[0,1,1,0] old}
|
||||||
|
|
||||||
|
alignLinearize :: PGF -> Tree -> String
|
||||||
|
alignLinearize pgf = prGraph True . lin2graph . linsMark where
|
||||||
|
linsMark t = [s | la <- cncnames pgf, s <- take 1 (linearizesMark pgf la t)]
|
||||||
|
|
||||||
|
lin2graph :: [String] -> [String]
|
||||||
|
lin2graph ss = prelude ++ nodes ++ links
|
||||||
|
|
||||||
|
where
|
||||||
|
|
||||||
|
prelude = ["rankdir=LR ;", "node [shape = record] ;"]
|
||||||
|
|
||||||
|
-- find all words
|
||||||
|
lins :: String -> [(String,String)]
|
||||||
|
lins [] = []
|
||||||
|
lins s = let (s1, s2) = if null s then ([],[]) else span (/='{') s in
|
||||||
|
let (s21,s22) = if null s2 then ([],[]) else span (/='}') (tail s2) in
|
||||||
|
if null s21 then lins s22 else wlink s21 : lins s22
|
||||||
|
|
||||||
|
-- separate a word to the link (1,2,3) and the word itself
|
||||||
|
wlink :: String -> (String,String)
|
||||||
|
wlink s = let (s1, s2) = span (/=']') s in
|
||||||
|
(tail s1, init (drop 1 s2))
|
||||||
|
|
||||||
|
-- make all marks unique to deal with discontinuities
|
||||||
|
nlins :: [(Int,[((Int,String),String)])]
|
||||||
|
nlins = [(i, [((j,m),w) | (j,(m,w)) <- zip [0..] (lins s)]) | (i,s) <- zip [0..] ss]
|
||||||
|
|
||||||
|
nodes = map mkStruct nlins
|
||||||
|
|
||||||
|
mkStruct (i, ws) = struct i ++ "[label = \"" ++ fields ws ++ "\"] ;"
|
||||||
|
|
||||||
|
fields ws = concat (intersperse "|" [tag (mark m) ++ " " ++ w | (m,w) <- ws])
|
||||||
|
|
||||||
|
struct i = "struct" ++ show i
|
||||||
|
|
||||||
|
mark (j,n) = "n" ++ show j ++ "a" ++ uncommas n
|
||||||
|
|
||||||
|
uncommas = map (\c -> if c==',' then 'c' else c)
|
||||||
|
|
||||||
|
tag s = "<" ++ s ++ ">"
|
||||||
|
|
||||||
|
links = concatMap mkEdge (init nlins)
|
||||||
|
|
||||||
|
mkEdge (i,lin) = let lin' = snd (nlins !! (i+1)) in -- next lin in the list
|
||||||
|
[edge i v w | (v@(_,p),_) <- lin, (w@(_,q),_) <- lin', p == q]
|
||||||
|
|
||||||
|
edge i v w =
|
||||||
|
struct i ++ ":" ++ mark v ++ " -> " ++ struct (i+1) ++ ":" ++ mark w ++ " ;"
|
||||||
|
|
||||||
|
{-
|
||||||
|
digraph{
|
||||||
|
rankdir ="LR" ;
|
||||||
|
node [shape = record] ;
|
||||||
|
|
||||||
|
struct1 [label = "<f0> this|<f1> very|<f2> intelligent|<f3> man"] ;
|
||||||
|
struct2 [label = "<f0> cet|<f1> homme|<f2> tres|<f3> intelligent|<f4> ci"] ;
|
||||||
|
|
||||||
|
struct1:f0 -> struct2:f0 ;
|
||||||
|
struct1:f1 -> struct2:f2 ;
|
||||||
|
struct1:f2 -> struct2:f3 ;
|
||||||
|
struct1:f3 -> struct2:f1 ;
|
||||||
|
struct1:f0 -> struct2:f4 ;
|
||||||
|
}
|
||||||
|
-}
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user