started MiniresourceSan ; doesn't compile yet

2013-05-31 08:00:09 +00:00
parent aa644169c2
commit 0ede1365dc
1 changed files with 268 additions and 0 deletions
@@ -0,0 +1,268 @@
+concrete MiniresourceSan of Miniresource = open Prelude in {
+
+-- module GrammarSan
+
+  flags coding = utf8;
+
+  lincat
+    S   = {s : Str} ; 
+    Cl = {s : Bool => Str} ; 
+    NP = NounPhrase ;  
+      -- {s : Str} ;     
+    VP = VerbPhrase ;  
+      -- {verb : Verb ; compl : Str} ;  
+    AP = {s : Str; monoSyl: Bool} ;
+    CN = Noun ;        -- {s : Str; c : Str} ;
+    Det = {s : Str ; n : Number} ;
+    N = Noun ;         -- {s : Str; c : Str} ;
+    A = Adj ;          -- {s : Str; monoSyl: Bool} ; 
+    V = Verb;          -- {s : Str ; pp,ds,dp,ep : Str ; neg : Str}
+    V2 = Verb ;
+    AdA = {s : Str} ; 
+    Pol = {s : Str ; b : Bool} ;
+    Tense = {s : Str} ;
+    Conj = {s : SForm => Str} ;    
+
+  lin
+    UseCl t p cl = {s = t.s ++ p.s ++ cl.s ! p.b} ; 
+
+    PredVP np vp = {
+       s  = \\p => np.s ++ neg p ++ vp.verb.s ++ vp.compl
+       } ;
+
+    ComplV2 v2 np = {
+     verb  = v2 ;
+     compl = np.s
+     } ; 
+
+    UseV v = {
+      verb = v ; 
+      compl = []
+      } ; 
+
+    DetCN det cn = case det.n of {
+            Sg => {s = det.s ++ cn.c ++ cn.s ; n = Sg } ;
+            Pl => {s = det.s ++ "些" ++ cn.s ; n = Pl }             
+      } ;
+      
+    ModCN ap cn = case ap.monoSyl of {
+            True => {s = ap.s ++ cn.s ; c = cn.c} ;
+            False => {s = ap.s ++ "的" ++ cn.s ; c = cn.c} 
+            } ;
+
+    CompAP ap = {
+      verb = copula ;
+      compl = ap.s ++ "的"
+      } ;
+
+    AdAP ada ap = {
+      s = ada.s ++ ap.s ;
+      monoSyl = False
+      } ;
+
+    ConjNP co x y = {
+      s = x.s ++ co.s ! Phr NPhrase ++ y.s
+      } ;
+
+    ConjS  co x y = {s = x.s ++ co.s ! Sent ++ y.s} ;  
+
+    UseN n = n ;
+    UseA adj = adj ;
+
+    a_Det = mkDet "一" Sg ;
+    every_Det = mkDet "每" Sg ;        
+    the_Det = mkDet "那" Sg ;
+
+    this_Det = mkDet "这" Sg ;
+    these_Det = mkDet "这" Pl ;
+    that_Det = mkDet "那" Sg ;
+    those_Det = mkDet "那" Pl ;
+
+    i_NP = pronNP "我" ;
+    youSg_NP = pronNP "你" ;
+    he_NP = pronNP "他" ;
+    she_NP = pronNP "她" ;
+    we_NP = pronNP "我们" ;
+    youPl_NP = pronNP "你们" ;
+    they_NP = pronNP "他们" ;
+
+    very_AdA = ss (word "非常") ;    
+    
+    and_Conj = {s = table {
+                    Phr NPhrase => "和" ;
+                    Phr APhrase => "而" ;
+                    Phr VPhrase => "又" ;
+                    Sent =>  []
+                          }
+                } ;
+
+    or_Conj  = {s = table {
+                    Phr _ => "或" ;
+                    Sent => word "还是"
+                          }
+                } ;
+
+    Pos  = {s = [] ; b = True} ;
+    Neg  = {s = [] ; b = False} ;
+    Pres = {s = []} ;
+    Perf = {s = []} ;
+
+-- module TestChi
+
+lin
+  man_N = mkN "男人" ;  
+  woman_N = mkN "女人" ;
+  house_N = mkN "房子" ;
+  tree_N = mkN "树" "棵";
+  big_A = mkA "大" ;
+  small_A = mkA "小" ;
+  green_A = mkA "绿" ;
+  walk_V = mkV "走" ;
+  arrive_V = mkV "到" ;
+  love_V2 = mkV2 "爱" ;
+  please_V2 = mkV2 "麻烦" ;
+
+-- module ResSan
+
+-- parameters
+
+param
+    Number = Sg | Dl | Pl ;
+    Case = Nom | Acc | Ins | Dat | Abl | Gen | Loc | Voc ;
+    Gender = Masc | Fem | Neutr ;
+    Person = P3 | P2 | P1 ;
+
+    Agr = Ag Gender Number Person ;
+
+    VForm = VPres Number Person ;
+
+-- parts of speech
+
+oper
+
+  VerbPhrase = {verb : Verb ; compl : Str} ;
+  NounPhrase = {s : Case => Str ; a : Agr} ; 
+
+-- for morphology
+
+  Noun : Type = {s : Number => Case => Str; g : Gender} ;
+  Adj  : Type = {s : Gender => Number => Case => Str} ;
+  Verb : Type = {s : VForm => Str} ;
+
+  mkNoun : (s1,_,_,_,_,_,_,_, _,_,_, _,_,_,_,_,s17 : Str) -> Gender -> Noun = 
+    \snon,sacc,sins,sdat,sabl,sgen,sloc,svoc,
+     dnomaccvoc,dinsdatabl,dgenloc,
+     pnomvoc,pacc,pins,pdatabl,pgen,ploc, 
+     gen -> {
+      s = table {
+        Sg => table {
+           Nom => snom ; Acc => sacc ; Ins => sins ; Dat => sdat ; Abl => sabl ; Gen => sgen ; Loc => sloc ; Voc => svoc
+           } ;
+        Dl => table {
+           Nom | Voc => dnomaccvoc ; Ins | Dat | Abl => dinsdatabl ; Gen | Loc => dgenloc 
+           } ;
+        Pl => table {
+           Nom | Voc => pnomvoc ; Acc => pacc ; Ins => pins ; Dat | Abl => pdatabl ; Gen => pgen ; Loc => ploc
+           }
+        } ;
+      g = gen
+      } ;
+
+  endingNoun : Str -> (s1,_,_,_,_,_,_,_, _,_,_, _,_,_,_,_,s17 : Str) -> Gender -> Noun = 
+    \stem,
+     snon,sacc,sins,sdat,sabl,sgen,sloc,svoc,
+     dnomaccvoc,dinsdatabl,dgenloc,
+     pnomvoc,pacc,pins,pdatabl,pgen,ploc, 
+     gen -> 
+       mkNoun
+         (stemm + snon) (stem + sacc) (stem + sins) (stem + sdat) (stem + sabl) (stem + sgen) (stem + sloc) (stem + svoc) 
+         (stem + dnomaccvoc) (stem + dinsdatabl) (stem + dgenloc) 
+         (stem + pnomvoc) (stem + pacc) (stem + pins) (stem + pdatabl) (stem + pgen) (stem + ploc) 
+         gen ;
+
+
+  ramaNoun : Str -> Noun = \rama ->
+    let ram = init rama in
+    endingNoun ram
+      "aH" "amx" "eNe" "a:ya" "a:tx" "asxya" "e" "a"
+      "o+" "a:t'xya:mx" "ayo:" 
+      "a:H" "a:nx" "e+H" "e:t'yaH" "a:Na:ma" "e:Su" 
+      Masc ;
+
+  mkVerb : (s1,_,_,_,_,_,_,_,s9 : Str) -> Verb = 
+    \s3,s2,s1,d3,d2,d1,p3,p2,p1 -> {
+      s = table {
+        VPres Sg P3 => s3 ;
+        VPres Sg P2 => s2 ;
+        VPres Sg P1 => s1 ;
+        VPres Dl P3 => d3 ;
+        VPres Dl P2 => d2 ;
+        VPres Dl P1 => d1 ;
+        VPres Pl P3 => p3 ;
+        VPres Pl P2 => p2 ;
+        VPres Pl P1 => p1
+        }
+      } ;
+
+  endingVerb : Str -> (s1,_,_,_,_,_,_,_,s9 : Str) -> Verb = 
+    \stem,s3,s2,s1,d3,d2,d1,p3,p2,p1 -> 
+      mkVerb
+        (stem + s3) (stem + s2) (stem + s1) (stem + d3) (stem + d2) (stem + d1) (stem + p3) (stem + p2) (stem + p1) ;
+
+  patVerb : Str -> Verb = \pat ->
+    endingVerb pat
+      "ita" "isa" "ima" "ataH" "at'aH" "avaH" "inxta" "at'a" "a:maH" ;
+
+
+{-
+  neg : Bool -> Str = \b -> case b of {True => [] ; False => "不"} ;
+
+-- for structural words
+
+  mkDet : Str -> Number -> {s : Str ; n : Number} = \s,n -> {
+    s = word s ;
+    n = n
+    } ;
+
+  pronNP : (s : Str) -> NounPhrase = \s -> {
+    s = word s
+    } ;
+    
+-- Write the characters that constitute a word separately. 
+-- This enables straightforward tokenization.
+
+  bword : Str -> Str -> Str = \x,y -> x ++ y ; 
+  -- change to x + y to treat words as single tok ens
+
+  word : Str -> Str = \s -> case s of {
+      x@? + y@? + z@? + u@? => bword x (bword y (bword z u)) ;
+      x@? + y@? + z@? => bword x (bword y z) ;
+      x@? + y@? => bword x y ;
+      _ => s
+      } ;
+
+-- module ParadigmsChi
+
+oper
+  mkN = overload {
+    mkN : (man : Str) -> N 
+      = \n -> lin N (mkNoun n "个") ;  
+    mkN : (man : Str) -> Str -> N 
+      = \n,c -> lin N (mkNoun n c)
+    } ;  
+      
+  mkA : (small : Str) -> A 
+      = \a -> lin A (mkAdj a) ;
+      
+  mkV : (walk : Str) -> V 
+      = \s -> lin V (mkVerb s) ; 
+
+  mkV2 = overload {
+    mkV2 : (love : Str) -> V2 
+      = \love -> lin V2 (mkVerb love) ;
+    mkV2 : (love : V) -> V2 
+      = \love -> lin V2 love ;
+   } ;
+-}
+
+}