Estonian - the 29th complete RGL language. Copied from Kaarel Kaljurand's and Inari Listenmaa's repository in https://github.com/GF-Estonian/GF-Estonian, where later developments will continue to take place.

2026-05-12 04:32:50 -06:00 · 2013-10-18 11:45:06 +00:00
parent 02cbf49516
commit 90ee7c7288
35 changed files with 111190 additions and 1 deletions
--- a/lib/src/estonian/ParadigmsEst.gf
+++ b/lib/src/estonian/ParadigmsEst.gf
@@ -0,0 +1,786 @@
+--1 Estonian Lexical Paradigms
+--
+-- Based on the Finnish Lexical Paradigms by Aarne Ranta 2003--2008
+--
+-- This is an API to the user of the resource grammar 
+-- for adding lexical items. It gives functions for forming
+-- expressions of open categories: nouns, adjectives, verbs.
+-- 
+-- Closed categories (determiners, pronouns, conjunctions) are
+-- accessed through the resource syntax API and $Structural.gf$. 
+--
+-- The main difference with $MorphoEst.gf$ is that the types
+-- referred to are compiled resource grammar types. We have moreover
+-- had the design principle of always having existing forms, rather
+-- than stems, as string arguments of the paradigms.
+--
+-- The structure of functions for each word class $C$ is the following:
+-- there is a polymorphic constructor $mkC$, which takes one or
+-- a few arguments. In Estonian, one argument is enough in ??? % of
+-- cases on average (TODO: measure and fill in the percentage).
+
+resource ParadigmsEst = open 
+  (Predef=Predef), 
+  Prelude, 
+  MorphoEst,
+  HjkEst,
+  CatEst
+  in {
+
+  flags optimize=noexpand ; coding=utf8;
+
+--2 Parameters 
+--
+-- To abstract over number and (some) case names,
+-- we define the following identifiers. The application programmer
+-- should always use these constants instead of the constructors
+-- defined in $ResEst$.
+
+-- Signatures only: each name declared here is bound to its constructor
+-- in the implementation part of this module.
+oper
+  Number   : Type ;     -- grammatical number
+
+  singular : Number ;
+  plural   : Number ;
+
+  Case        : Type ;  -- nominal case
+  nominative  : Case ; -- e.g. "karp"
+  genitive    : Case ; -- e.g. "karbi"
+  partitive   : Case ; -- e.g. "karpi"
+  illative    : Case ; -- e.g. "karbisse/karpi"
+  inessive    : Case ; -- e.g. "karbis"
+  elative     : Case ; -- e.g. "karbist"
+  allative    : Case ; -- e.g. "karbile"
+  adessive    : Case ; -- e.g. "karbil"
+  ablative    : Case ; -- e.g. "karbilt"
+  translative : Case ; -- e.g. "karbiks"
+  terminative : Case ; -- e.g. "karbini"
+  essive      : Case ; -- e.g. "karbina"
+  abessive    : Case ; -- e.g. "karbita"
+  comitative  : Case ; -- e.g. "karbiga"
+
+  -- Infinitive forms, used to select the form of a verbal complement
+  -- (see mkVVf and mkV2Vf).
+  infDa : InfForm ; -- e.g. "lugeda"
+  infDes : InfForm ; -- e.g. "lugedes"
+  infMa : InfForm ; -- e.g. "lugema"
+  infMas : InfForm ; -- e.g. "lugemas"
+  infMaks : InfForm ; -- e.g. "lugemaks"
+  infMast : InfForm ;  -- e.g. "lugemast"
+  infMata : InfForm ; -- e.g. "lugemata"
+
+-- The following type is used for defining *rection*, i.e. complements
+-- of many-place verbs and adjectives. A complement can be defined by
+-- just a case, or by a pre/postposition together with a case.
+
+  -- Each constructor builds a Prep from a governed case and, except for
+  -- casePrep, the adposition string.
+  prePrep     : Case -> Str -> Prep ;  -- preposition, e.g. comitative "koos"
+  postPrep    : Case -> Str -> Prep ;  -- postposition, e.g. genitive "taga"
+  postGenPrep :         Str -> Prep ;  -- genitive postposition, e.g. "taga"
+  casePrep    : Case ->        Prep ;  -- just case, e.g. adessive
+
+  -- TODO build the dict 
+  -- Lexicon entry types: records holding precomputed forms, accepted by
+  -- the corresponding mkN / mkA / mkV / mkAdv overloads.
+  NW : Type ;   -- Noun from DictEst (WordNet)
+  AW : Type ;   -- Adjective from DictEst (WordNet)
+  VW : Type ;   -- Verb from DictEst (WordNet)
+  AdvW : Type ; -- Adverb from DictEst (WordNet)
+
+--2 Nouns
+
+-- The worst case gives six forms.
+-- In practice just a couple of forms are needed to define the different
+-- stems, vowel alternation, and vowel harmony.
+
+oper
+
+-- The regular noun heuristic takes just one form (singular
+-- nominative) and analyses it to pick the correct paradigm.
+-- It applies grade alternation automatically, and is hence not usable
+-- for words whose stem must not alternate.
+--
+-- If the one-argument paradigm does not give the correct result, one can
+-- give more forms. The two-argument variant adds the singular genitive
+-- (e.g. "link - lingi"), the three-argument variant also adds the
+-- singular partitive (e.g. "tukk - tuku - tukku"), and the four-argument
+-- variant also adds the plural partitive
+-- (e.g. "pank - panga - panka - panku").
+
+  -- Documented signature of the noun constructor. Argument names and
+  -- comments follow the implementation (mk1N, mk2N, mk3N, mk4N, mk6N):
+  -- forms are added in the order sg nom, sg gen, sg part, pl part.
+  mkN : overload {
+    mkN : (nisu : Str) -> N ;  -- predictable nouns (sg nom only), covers 82%
+    mkN : (link,lingi : Str) -> N ; -- sg nom, sg gen
+    mkN : (tukk,tuku,tukku : Str) -> N ; -- sg nom, sg gen, sg part
+    mkN : (pank,panga,panka,panku : Str) -> N ; -- sg nom,gen,part, pl.part
+
+--    mkN : (olo,n,a,na,oon,jen,ja,ina,issa,ihin : Str) -> N ; -- worst case, 10 forms
+    mkN : (oun,ouna,ouna,ounasse,ounte,ounu : Str) -> N ; -- worst case, 6 forms: sg nom,gen,part,illat, pl gen,part
+    -- NOTE: a 7-form variant used to be listed here, but the implementation
+    -- has no such overload, so it is not part of the documented API.
+    mkN : (pika : Str) -> (juna  : N) -> N ; -- compound with invariable prefix
+    mkN : (oma : N)    -> (tunto : N) -> N ; -- compound with inflecting prefix
+    mkN : NW -> N ;  -- noun from DictEst (WordNet)
+  } ;
+
+-- Nouns used as functions need a case, of which the default is
+-- the genitive.
+
+  -- Relational nouns: the one-argument form uses a bare genitive complement.
+  mkN2 : overload {
+    mkN2 : N -> N2 ;        -- relational noun with genitive
+    mkN2 : N -> Prep -> N2  -- relational noun with another prep.
+    } ;
+
+  mkN3  : N -> Prep -> Prep -> N3 ; -- relation with two complements
+
+-- Proper names can be formed by using declensions for nouns.
+-- Only the singular forms of the noun are kept in the name.
+
+  mkPN : overload {
+    mkPN : Str -> PN ;  -- predictable noun made into name
+    mkPN : N -> PN      -- any noun made into name
+    } ;
+
+--2 Adjectives
+
+-- Non-comparison one-place adjectives are just like nouns.
+-- The regular adjectives are based on $regN$ in the positive.
+-- Comparison adjectives have three forms. 
+-- The comparative and the superlative
+-- are always inflected in the same way, so the nominative of them is actually
+-- enough (TODO: confirm).
+-- TODO: update these types to include the new boolean non-inflection marker
+
+  -- Documented signature of the adjective constructor, kept in step with
+  -- the implementation: the agreement marker has type Infl (values such as
+  -- Regular and Invariable), not Bool.
+  mkA : overload {
+    mkA : Str -> A ;  -- regular noun made into adjective
+    mkA : N -> A ;    -- any noun made into adjective
+    mkA : N -> (infl : Infl) -> A ; -- noun made into adjective, agreement type specified
+    mkA : N -> (parem, parim : Str) -> A ; -- deviating comparison forms
+    mkA : N -> (valmim, valmeim : Str) -> (infl : Infl) -> A ; -- deviating comparison forms, agreement type specified
+    mkA : AW -> A ;  -- adjective from DictEst (WordNet)
+  } ;
+
+-- Two-place adjectives need a case for the second argument.
+
+  -- Two-place adjective: the adjective record extended with its
+  -- complement marker in c2, e.g. casePrep adessive.
+  mkA2 : A -> Prep -> A2 =
+    \adj,compl -> adj ** {c2 = compl ; lock_A2 = <>} ;
+
+  -- Genitive attribute used as an adjective: no agreement with the head
+  -- and no comparison forms.
+  genAttrA : Str -> A ;
+
+--2 Verbs
+--
+-- The grammar does not cover the quotative mood and some nominal
+-- forms. One way to see the coverage is to linearize a verb to
+-- a table.
+-- The worst case needs eight forms, as shown in the following.
+
+  -- Documented signature of the verb constructor. Argument order follows
+  -- the implementation: ma-infinitive, da-infinitive, b-form, takse-form;
+  -- for particle verbs the particle string comes first, then the verb.
+  mkV : overload {
+    mkV : (lugema : Str) -> V ;     -- predictable verbs (ma-infinitive only), covers n %
+    mkV : (lugema,lugeda : Str) -> V ; -- ma-infinitive, da-infinitive
+    mkV : (lugema,lugeda,loeb : Str) -> V ; -- also the b-form
+    mkV : (lugema,lugeda,loeb,loetakse : Str) -> V ; -- also the takse-form
+    mkV : (tegema,teha,teeb,tehakse,tehke,tegi,teinud,tehtud : Str) -> V ; -- worst-case verb
+    mkV : (aru : Str) -> (saama : V) -> V ; -- particle verbs (fixed expressions), TODO
+    mkV : VW -> V ;  -- verb from DictEst (WordNet)
+  } ;
+
+-- All the patterns above have $nominative$ as subject case.
+-- If another case is wanted, use the following.
+
+  -- Returns the verb with its subject case replaced by the given case.
+  -- NOTE(review): the example "täytyä" appears to be Finnish, carried over
+  -- from the Finnish paradigms; an Estonian example is still to be supplied.
+  caseV : Case -> V -> V ;  -- deviating subj. case, e.g. genitive "täytyä"
+
+-- The verbs "be" and "go" are special.
+
+  vOlema : V ; -- the verb "be"
+  vMinema : V ; -- the verb "go"
+
+
+--3 Two-place verbs
+--
+-- Two-place verbs need an object case, and can have a pre- or postposition.
+-- The default is direct (accusative) object. There is also a special case
+-- with case only. The string-only argument case yields a regular verb with
+-- accusative object.
+
+  -- Two-place verb constructor; the first two variants take a direct
+  -- (accusative) object.
+  mkV2 : overload {
+    mkV2 : Str -> V2 ;  -- predictable direct transitive
+    mkV2 : V -> V2 ;    -- direct transitive
+    mkV2 : V -> Case -> V2 ; -- complement just case
+    mkV2 : V -> Prep -> V2 ; -- complement pre/postposition
+    } ;
+
+
+--3 Three-place verbs
+--
+-- Three-place (ditransitive) verbs need two prepositions, of which
+-- the first one or both can be absent.
+
+  -- NOTE(review): the example verbs below appear to be Finnish, carried over
+  -- from the Finnish paradigms; only the case patterns apply here.
+  mkV3     : V -> Prep -> Prep -> V3 ;  -- e.g. puhua, allative, elative
+  dirV3    : V -> Case -> V3 ;          -- siirtää, (accusative), illative
+  dirdirV3 : V         -> V3 ;          -- antaa, (accusative), (allative)
+
+
+--3 Other complement patterns
+--
+-- Verbs and adjectives can take complements such as sentences,
+-- questions, verb phrases, and adjectives.
+
+  -- NOTE(review): most example verbs in the comments below appear to be
+  -- Finnish ("sanoa", "alkaa", ...), carried over from the Finnish paradigms.
+  mkV0  : V -> V0 ; --%
+  mkVS  : V -> VS ;
+  mkV2S : V -> Prep -> V2S ; -- e.g. "sanoa" allative
+  mkVV  : V -> VV ;  -- e.g. "alkaa"; complement in the da-infinitive (infDa)
+  mkVVf : V -> InfForm -> VV ; -- e.g. "hakkama" infMa
+  mkV2V : V -> Prep -> V2V ;  -- e.g. "käskeä" genitive; complement in the ma-infinitive (infMa)
+  mkV2Vf : V -> Prep -> InfForm -> V2V ; -- e.g. "kieltää" partitive infMast  
+  mkVA  : V -> Prep -> VA ; -- e.g. "maistua" ablative
+  mkV2A : V -> Prep -> Prep -> V2A ; -- e.g. "maalata" accusative translative
+  mkVQ  : V -> VQ ; 
+  mkV2Q : V -> Prep -> V2Q ; -- e.g. "kysyä" ablative 
+
+  mkAS  : A -> AS ; --%
+  mkA2S : A -> Prep -> A2S ; --%
+  mkAV  : A -> AV ; --%
+  mkA2V : A -> Prep -> A2V ; --%
+
+-- Notice: categories $AS, A2S, AV$ are just $A$ and $A2V$ is just $A2$;
+-- the second argument is given
+-- as an adverb. Likewise 
+-- $V0$ is just $V$.
+
+  V0 : Type ; --%
+  AS, A2S, AV, A2V : Type ; --%
+
+--.
+-- The definitions should not bother the user of the API. So they are
+-- hidden from the document.
+
+  -- The public parameter types are those of MorphoEst.
+  Number = MorphoEst.Number ;
+  Case   = MorphoEst.Case ;
+
+  -- Number constants.
+  singular = Sg ;
+  plural   = Pl ;
+
+  -- Case constants.
+  nominative  = Nom ;
+  genitive    = Gen ;
+  partitive   = Part ;
+  illative    = Illat ;
+  inessive    = Iness ;
+  elative     = Elat ;
+  allative    = Allat ;
+  adessive    = Adess ;
+  ablative    = Ablat ;
+  translative = Transl ;
+  terminative = Termin ;
+  essive      = Ess ;
+  abessive    = Abess ;
+  comitative  = Comit ;
+
+  -- Infinitive-form constants, in the order they are declared in the API.
+  infDa   = InfDa ;
+  infDes  = InfDes ;
+  infMa   = InfMa ;
+  infMas  = InfMas ;
+  infMaks = InfMaks ;
+  infMast = InfMast ;
+  infMata = InfMata ;
+
+  -- A Prep record holds the adposition string (s), the governed case (c)
+  -- and a flag telling whether the string is a preposition (isPre).
+  prePrep : Case -> Str -> Prep = \cas,word ->
+    {s = word ; c = NPCase cas ; isPre = True ; lock_Prep = <>} ;
+
+  postPrep : Case -> Str -> Prep = \cas,word ->
+    {s = word ; c = NPCase cas ; isPre = False ; lock_Prep = <>} ;
+
+  -- Postposition governing the genitive.
+  postGenPrep word =
+    {s = word ; c = NPCase genitive ; isPre = False ; lock_Prep = <>} ;
+
+  -- Bare case: empty adposition string.
+  casePrep : Case -> Prep = \cas ->
+    {s = [] ; c = NPCase cas ; isPre = True ; lock_Prep = <>} ;
+
+  -- Direct object marker: NPAcc with an empty adposition string.
+  accPrep =
+    {s = [] ; c = NPAcc ; isPre = True ; lock_Prep = <>} ;
+
+  -- Dictionary entry types: precomputed form tables (or a plain string
+  -- for adverbs) tagged with their own lock field.
+  NW = {s : NForms ; lock_NW : {}} ;
+  AW = {s : NForms ; lock_AW : {}} ;
+  VW = {s : VForms ; lock_VW : {}} ;
+  AdvW = {s : Str ; lock_AdvW : {}} ;
+
+
+  -- Noun constructor: dispatches on the number and type of arguments.
+  -- String arguments are given in the order sg nom, sg gen, sg part,
+  -- pl part (four-argument form), or as the full six-form list.
+  mkN = overload {
+    mkN : (nisu : Str) -> N = mk1N ;
+    mkN : (link,lingi : Str) -> N = mk2N ;
+    mkN : (tukk,tuku,tukku : Str) -> N = mk3N ;
+    -- the fourth form is the plural partitive (mk4N stores it in slot 5)
+    mkN : (paat,paadi,paati,paate : Str) -> N = mk4N ;
+    mkN : (oun,ouna,ouna,ounasse,ounte,ounu : Str) -> N = mk6N ;
+
+    mkN : (sora : Str) -> (tie : N) -> N = mkStrN ;
+    mkN : (oma,tunto : N) -> N = mkNN ;
+    -- dictionary entry: lock field added explicitly, like in mk1N..mk6N
+    mkN : (sana : NW) -> N = \w -> nForms2N w.s ** {lock_N = <>} ;
+  } ;
+
+  -- Adjectives whose forms (incl. comparative and superlative) are derived
+  -- from noun forms; both variants are marked as regularly inflecting.
+
+  -- From a single string, via the one-argument noun heuristic.
+  mk1A : Str -> A = \suur ->
+    aForms2A (nforms2aforms (hjk_type suur)) ** {infl = Regular} ;
+
+  -- From an existing noun.
+  mkNA : N -> A = \suur ->
+    aForms2A (nforms2aforms (n2nforms suur)) ** {infl = Regular} ;
+
+
+  -- One-argument noun: paradigm guessed from the singular nominative.
+  mk1N : (link : Str) -> N = \sgNom ->
+    nForms2N (hjk_type sgNom) ** {lock_N = <>} ;
+
+  -- Two-argument noun: the paradigm is guessed by nForms2, after which the
+  -- two user-supplied forms overwrite slots 0 and 1 of the guessed table.
+  mk2N : (link,lingi : Str) -> N = \sgNom,sgGen ->
+    let
+      guessed : NForms = nForms2 sgNom sgGen ;
+      forced : NForms = table {
+        0 => sgNom ;
+        1 => sgGen ;
+        2 => guessed ! 2 ;
+        3 => guessed ! 3 ;
+        4 => guessed ! 4 ;
+        5 => guessed ! 5
+      } ;
+    in nForms2N forced ** {lock_N = <>} ;
+
+
+  -- Three-argument noun: the paradigm is guessed by nForms3, after which the
+  -- three user-supplied forms overwrite slots 0-2 of the guessed table.
+  mk3N : (tukk,tuku,tukku : Str) -> N = \sgNom,sgGen,sgPart ->
+    let
+      guessed : NForms = nForms3 sgNom sgGen sgPart ;
+      forced : NForms = table {
+        0 => sgNom ;
+        1 => sgGen ;
+        2 => sgPart ;
+        3 => guessed ! 3 ;
+        4 => guessed ! 4 ;
+        5 => guessed ! 5
+      } ;
+    in nForms2N forced ** {lock_N = <>} ;
+
+{-  mk1N : (link : Str) -> N = \s -> nForms2N (hjk_type s) ** {lock_N = <> } ;
+  mk2N : (link,lingi : Str) -> N = \s,t -> nForms2N (nForms2 s t)  ** {lock_N = <>} ;
+  mk3N : (tukk,tuku,tukku : Str) -> N = \s,t,u -> nForms2N (nForms3 s t u) ** {lock_N = <>} ;  
+  --regular mk4N
+  mk4N : (paat,paadi,paati,paate : Str) -> N = \s,t,u,v -> nForms2N (nForms4 s t u v) ** {lock_N = <>} ;
+-}
+
+  -- Four-argument noun (experimental): makes sure that the user-specified
+  -- forms end up in the paradigm even if the guessed remainder is wrong.
+  -- Arguments: sg nom, sg gen, sg part, pl part. The fourth argument is the
+  -- plural partitive (it is matched as such by nForms4 and stored in slot 5),
+  -- so the type binder is named "paate" rather than the pl gen "paatide".
+  mk4N : (paat,paadi,paati,paate : Str) -> N = \paat,paadi,paati,paate ->  
+    let nfs : NForms = (nForms4 paat paadi paati paate) ; 
+        nfs_fixed : NForms = table {
+                0 => paat ;
+                1 => paadi ;
+                2 => paati ;
+                3 => nfs ! 3 ;   -- guessed
+                4 => nfs ! 4 ;   -- guessed
+                5 => paate 
+        } ;
+    in nForms2N nfs_fixed ** {lock_N = <> } ;
+
+
+  -- Worst-case noun: all six forms are supplied and passed on to nForms6
+  -- unchanged.
+  mk6N : (oun,ouna,ouna,ounasse,ounte,ounu : Str) -> N =
+    \f1,f2,f3,f4,f5,f6 ->
+      nForms2N (nForms6 f1 f2 f3 f4 f5 f6) ** {lock_N = <>} ;
+
+  -- Compound with an invariable prefix glued onto every form of the head.
+  mkStrN : Str -> N -> N = \prefix,head -> {
+    s = \\nf => prefix + (head.s ! nf) ;
+    lock_N = <>
+    } ;
+
+  -- Compound of two nouns; both parts take the same form.
+  mkNN : N -> N -> N = \first,second -> {
+    s = \\nf => (first.s ! nf) + (second.s ! nf) ;
+    lock_N = <>
+    } ; ---- TODO: oma in possessive suffix forms
+
+  -- Two-form noun heuristic: picks a paradigm from the singular nominative
+  -- (link) and the singular genitive (lingi). The patterns are tried from
+  -- top to bottom, so their order matters; anything that matches none of
+  -- them falls back to the one-argument heuristic hjk_type.
+  nForms2 : (_,_ : Str) -> NForms = \link,lingi -> 
+    let
+      i = last lingi ;       -- final character of the genitive
+      reegl = init lingi ;   -- genitive without its final character
+    in
+      case <link,lingi> of { 
+        -- nominative in -el/-er
+        <_ + "el", _ + #c + "li"> => hjk_type_IVb_audit1 link reegl ;
+        <_ + "er", _ + #c + "ri"> => hjk_type_IVb_audit1 link reegl ;
+        <_ + #c + "el", _ + #c + "eli"> => hjk_type_IVb_audit link i ;
+        <_ + #c + "er", _ + #c + "eri"> => hjk_type_IVb_audit link i ;
+
+        -- nominative and genitive both in -e, differing in the consonants before it
+        <_ + "be", _ + "pe">  => hjk_type_VII_touge2 link lingi ;
+        <_ + "de", _ + "te">  => hjk_type_VII_touge2 link lingi ;
+        <_ + "ge", _ + "ke">  => hjk_type_VII_touge2 link lingi ;
+        <_ + "pe", _ + "ppe">  => hjk_type_VII_touge2 link lingi ;
+        <_ + "te", _ + "tte">  => hjk_type_VII_touge2 link lingi ;
+        <_ + "ke", _ + "kke">  => hjk_type_VII_touge2 link lingi ;
+        <_ + "nne", _ + "nde">  => hjk_type_VII_touge2 link lingi ;
+
+	--below 3 don't add much, could just delete
+	--t6uge recognition is easy, because that doesn't introduce lot of other errors
+	--but probably pointless to fill this with all cases
+	<_ + "e", _ + #c + "me"> => hjk_type_VII_touge2 link lingi ;
+        <_ + "se", _ + "ske">  => hjk_type_VII_touge2 link lingi ;
+        <_ + "re", _ + "rde">  => hjk_type_VII_touge2 link lingi ;
+	<_ + #v + "e", _+"de"> => hjk_type_VII_touge2 link lingi ; --riie:riide
+
+	--improved total count a little, but introduced new errors
+	--not recommended, not stable and productive word class
+	--<_ + "i", _ + "e">  => dMeri link lingi ;
+
+	--introduced a couple of errors, "aine" recognized as "kõne"
+        --<_ + "ne", _ + "ne">  => hjk_type_III_ratsu link ;
+
+        --heuristics to catch palk:palga but not maakas:maaka (for longer words, same with more ?s)
+        --didn't work, don't try this
+        --<? + ? + #c, ? + ? + #c + #v> => hjk_type_IVb_audit link i ; 
+        -- default: ignore the genitive and guess from the nominative alone
+        _ => hjk_type link 
+      } ;
+
+  -- Three-form noun heuristic: picks a paradigm from sg nom (tukk),
+  -- sg gen (tuku) and sg part (tukku). The patterns are tried from top to
+  -- bottom; the default delegates to the two-form heuristic nForms2.
+  nForms3 : (_,_,_ : Str) -> NForms = \tukk,tuku,tukku ->
+    let u = last tuku ;   -- final character of the genitive
+    in  case <tukk,tuku,tukku> of {
+      --cases handled reliabl(ish) by 1- and 2-arg opers
+      <_+"nd",_,_> => hjk_type tukk ;
+      <_+"el",_,_> => nForms2 tukk tuku ;
+      <_+"er",_,_> => nForms2 tukk tuku ;
+
+      --distinguish between hammas and maakas
+      <_+"as",_+"a",_+"ast"> => dHammas tukk tuku ;
+      <_+"es",_+"e",_+"est"> => dHammas tukk tuku ;
+      <_+"us",_+"u",_+"ust"> => dHammas tukk tuku ;
+      <_+"as",_,_+"at"> => hjk_type_IVb_maakas tukk ;
+
+      <_ + "ik", _ + "iku", _ + "ikku"> => hjk_type_VI_imelik tukk ; --imelik:_:imelikku caught here
+
+      -- consonant-final nominative, vowel-final genitive and partitive
+      <_ + #c, _ + #v, _ + #v> => hjk_type_VI_tukk tukk tuku ;
+      <_ + "ud", _ + "u", _ + "ut"> => nForms2 tukk tuku ;  -- -nud/-tud participles are not like 'voolik'
+      <_ + #c, _ + #v, _ + #v + "t"> => hjk_type_IVb_audit tukk u ;  --voolik:_:voolikut caught here
+      _ => nForms2 tukk tuku 
+    } ;
+
+  -- Four-form noun heuristic: sg nom (paat), sg gen (paadi), sg part (paati)
+  -- and pl part (paate). The fourth form is only used to tell apart classes
+  -- that the first three cannot distinguish; the default delegates to nForms3.
+  nForms4 : (_,_,_,_ : Str) -> NForms = \paat,paadi,paati,paate -> 
+    case <paat,paadi,paati,paate> of {
+     -- distinguish between joonis and segadus
+      <_ +("ne"|"s"),  _+"se", _+"st", _+"seid"> => hjk_type_Va_otsene paat ;
+      <_ +("ne"|"s"),  _+"se", _+"st", _+"si"> => hjk_type_Vb_oluline paat ;
+      
+      <_ +"ne", _+"se", _+"set", _+"seid"> => nForms3 paat paadi paati ; -- -ne adjectives ('algne') are not like 'tõuge'
+
+      --distinguish between kõne and aine
+      <_ +"e", _+"e", _+"et", _+"sid"> => hjk_type_III_ratsu paat ; 
+      <_ +"e", _+"e", _+"et", _+"eid"> => hjk_type_VII_touge2 paat paadi ;
+
+      _  => nForms3 paat paadi paati 
+      } ;
+{-
+  --Version that uses pl gen instead of pl part
+  nForms4 : (_,_,_,_ : Str) -> NForms = \paat,paadi,paati,paatide -> 
+    case <paat,paadi,paati,paatide> of {
+     -- pl gen can't distinguish between joonis and segadus
+    --  <_ +("ne"|"s"),  _+"se", _+"st", _+"seid"> => hjk_type_Va_otsene paat ;
+    --  <_ +("ne"|"s"),  _+"se", _+"st", _+"si"> => hjk_type_Vb_oluline paat ;
+      
+      --pl gen can distinguish between kõne and aine
+      --plus side that any noun that is formed with 4-arg,
+      --the user given forms are inserted to the paradigm, 
+      --and more forms are created from pl gen, none from pl part
+      <_ +"e", _+"e", _+"et", _+"de"> => hjk_type_III_ratsu paat ; 
+      <_ +"e", _+"e", _+"et", _+"te"> => hjk_type_VII_touge2 paat paadi ;
+
+      _  => nForms3 paat paadi paati 
+      } ;      
+-}
+
+  -- Relational nouns. With no explicit Prep the complement is a bare genitive.
+  mkN2 = overload {
+    mkN2 : N -> N2 = \noun -> mmkN2 noun (casePrep genitive) ;
+    mkN2 : N -> Prep -> N2 = mmkN2
+    } ;
+
+  -- Worker for mkN2: stores the complement marker and derives, via mkIsPre,
+  -- the isPre flag from it.
+  mmkN2 : N -> Prep -> N2 = \noun,compl ->
+    noun ** {c2 = compl ; isPre = mkIsPre compl ; lock_N2 = <>} ;
+
+  -- Three-place noun: the same as mmkN2, with one flag per complement.
+  mkN3 = \noun,compl2,compl3 -> noun ** {
+    c2 = compl2 ;
+    c3 = compl3 ;
+    isPre  = mkIsPre compl2 ;
+    isPre2 = mkIsPre compl3 ;
+    lock_N3 = <>
+    } ;
+  
+  -- Computes the isPre flag of a relational noun from its complement marker:
+  -- for a genitive complement the Prep's own isPre flag is negated (so a
+  -- bare genitive, whose Prep has isPre = True, yields False); every other
+  -- case yields True.
+  mkIsPre : Prep -> Bool = \prep ->
+    case prep.c of {
+      NPCase Gen => notB prep.isPre ;
+      _          => True
+    } ;
+
+  -- Proper names: only the singular forms of the underlying noun are used.
+  mkPN = overload {
+    mkPN : Str -> PN = mkPN_1 ;
+    mkPN : N -> PN = \noun ->
+      {s = \\cas => noun.s ! NCase Sg cas ; lock_PN = <>} ;
+    } ;
+
+  -- Name from a single string, inflected by the one-argument noun heuristic.
+  mkPN_1 : Str -> PN = \name ->
+    {s = \\cas => (mk1N name).s ! NCase Sg cas ; lock_PN = <>} ;
+
+-- adjectives
+
+  -- Adjective constructor. Comparison forms are derived from the noun by
+  -- noun2adjDeg unless given explicitly; infl defaults to Regular.
+  mkA = overload {
+    mkA : Str -> A  = mkA_1 ;
+    mkA : N -> A = \n -> noun2adjDeg n ** {infl = Regular ; lock_A = <>} ;
+    mkA : N -> (parem,parim : Str) -> A = regAdjective ;
+    mkA : N -> (infl : Infl) -> A = \n,infl -> noun2adjDeg n ** {infl = infl ; lock_A = <>} ;
+    -- TODO: temporary usage of regAdjective1
+    mkA : N -> (valmim,valmeim : Str) -> (infl : Infl) -> A =
+		\n,c,s,infl -> (regAdjective1 n c s) ** {infl = infl ; lock_A = <>} ;
+    -- dictionary entry: lock field added explicitly, like in the branches above
+    mkA : (sana : AW) -> A = \w -> noun2adjDeg (nForms2N w.s) ** {infl = Regular ; lock_A = <>} ;
+  } ;
+
+  -- Invariable attribute: the same string in every form.
+  genAttrA = \attr ->
+    {s = \\_,_ => attr ; infl = Invariable ; lock_A = <>} ;
+
+  -- One-string adjective: one-argument noun heuristic plus derived
+  -- comparison forms.
+  mkA_1 : Str -> A = \word ->
+    noun2adjDeg (mk1N word) ** {infl = Regular ; lock_A = <>} ;
+
+-- auxiliaries
+  -- Assembles an adjective from its three degree forms; the result is
+  -- marked as regularly inflecting.
+  mkAdjective : (_,_,_ : Adj) -> A = \pos,cmp,sup -> {
+    s = table {
+      Posit  => pos.s ;
+      Compar => cmp.s ;
+      Superl => sup.s
+      } ;
+    infl = Regular ;
+    lock_A = <>
+    } ;
+
+  -- Adjectives whose comparison forms are explicitly given.
+  -- Both comparison forms are inflected with the audit rule using the stem
+  -- vowel "a", which always works for them.
+  regAdjective : Noun -> Str -> Str -> A = \posit,compar,superl ->
+    let
+      comparAdj = noun2adjComp False (nForms2N (hjk_type_IVb_audit compar "a")) ;
+      superlAdj = noun2adjComp False (nForms2N (hjk_type_IVb_audit superl "a")) ;
+    in mkAdjective (noun2adj posit) comparAdj superlAdj ;
+
+  -- TODO: temporary hack converting A to Adjective; callers that extend
+  -- the result with ** need this type. Should be cleaned up (K).
+  regAdjective1 : Noun -> Str -> Str -> Adjective = regAdjective ;
+
+  -- Adjectives whose comparison forms can be derived from the sg gen.
+  -- In case of comparative this fails only for 70 adjectives.
+  -- Superlative is more complex, and does not always exist,
+  -- e.g. lai -> laiem -> laiim? / laieim?
+  -- See also: http://www.eki.ee/books/ekk09/index.php?p=3&p1=4&id=208
+  -- Rather use "kõige" + Comp instead of the superlative.
+  --
+  -- Construction: comparative = sg gen + "m"; superlative = sg gen with a
+  -- final "i" replaced by "e", + "im". Both are then passed to regAdjective.
+  noun2adjDeg : Noun -> Adjective = \kaunis ->
+    let
+      kauni = (kaunis.s ! NCase Sg Gen) ;   -- singular genitive
+      -- Convert the final 'i' to 'e' for the superlative
+      kaune : Str = case kauni of { kaun@(_) + "i" => kaun + "e" ; _ => kauni }
+    in
+    regAdjective kaunis (kauni + "m") (kaune + "im") ;
+
+
+-- verbs
+
+  -- Verb constructor: dispatches on the number and type of arguments.
+  mkV = overload {
+    mkV : (lugema : Str) -> V
+      = mk1V ;
+    mkV : (lugema,lugeda : Str) -> V
+      = mk2V ;
+    mkV : (lugema,lugeda,loeb : Str) -> V
+      = mk3V ;
+    mkV : (lugema,lugeda,loeb,loetakse : Str) -> V
+      = mk4V ;
+    mkV : (tegema,teha,teeb,tehakse,tehke,tegi,teinud,tehtud : Str) -> V
+      = mk8V ;
+    -- particle verbs: the particle string first, then the verb
+    mkV : (aru : Str) -> (saama : V) -> V
+      = mkPV ;
+    -- dictionary entry: precomputed forms, nominative subject
+    mkV : (sana : VW) -> V
+      = \entry -> vforms2V entry.s ** {sc = NPCase Nom ; lock_V = <>} ;
+  } ;
+
+  -- The N-argument verb constructors all work the same way: the forms are
+  -- computed by vFormsN, turned into a verb by vforms2V, and given a
+  -- nominative subject case.
+  mk1V : Str -> V = \ma ->
+    vforms2V (vForms1 ma) ** {sc = NPCase Nom ; lock_V = <>} ;
+
+  mk2V : (_,_ : Str) -> V = \ma,da ->
+    vforms2V (vForms2 ma da) ** {sc = NPCase Nom ; lock_V = <>} ;
+
+  mk3V : (_,_,_ : Str) -> V = \ma,da,b ->
+    vforms2V (vForms3 ma da b) ** {sc = NPCase Nom ; lock_V = <>} ;
+
+  mk4V : (x1,_,_,x4 : Str) -> V = \ma,da,b,takse ->
+    vforms2V (vForms4 ma da b takse) ** {sc = NPCase Nom ; lock_V = <>} ;
+
+  mk8V : (x1,_,_,_,_,_,_,x8 : Str) -> V = \f1,f2,f3,f4,f5,f6,f7,f8 ->
+    vforms2V (vForms8 f1 f2 f3 f4 f5 f6 f7 f8) ** {sc = NPCase Nom ; lock_V = <>} ;
+
+  -- Particle verb: forms and subject case of the base verb, with the given
+  -- string as the particle.
+  mkPV : (aru : Str) -> (saama : V) -> V = \particle,verb ->
+    {s = verb.s ; p = particle ; sc = verb.sc ; lock_V = <>} ;
+     
+  	
+  -- This used to be the last case: _ => Predef.error (["expected infinitive, found"] ++ ottaa) 
+  -- regexp example: ("" | ?) + ("a" | "e" | "i") + _ + "aa" => 
+  --
+  -- One-form verb heuristic: picks a conjugation class from the shape of the
+  -- ma-infinitive alone. The patterns are tried from top to bottom, so their
+  -- order matters; verbs matching none of them are treated as TS 50-52.
+  -- The "TS" numbers are the class numbers used in the comments below.
+  vForms1 : Str -> VForms = \lugema ->
+    let
+      luge = Predef.tk 2 lugema ;   -- ma-infinitive without its last two characters
+      loe = weaker luge ;           -- presumably the weak-grade stem; see weaker
+    in
+    case lugema of {
+      -- TS 49
+      -- Small class of CVVma
+      ? + ("ä"|"õ"|"i") + "ima" =>
+        cKaima lugema ;  --käima,viima,võima
+      ? + ("aa"|"ee"|"ää") + "ma" =>  
+        cSaama lugema ;  -- saama,jääma,keema
+      ? + ("oo"|"öö"|"üü") + "ma" =>
+        cJooma lugema ;  --jooma,looma,lööma,müüma,pooma,sööma,tooma
+
+      -- TS 53
+      -- NOTE(review): as written, this requires a consonant followed by a
+      -- vowel immediately before "elema"; a form like "tegelema" has a
+      -- consonant in that position. Confirm against the #c / #v definitions.
+      _ + #c + #v + "elema" =>
+        cTegelema lugema ; --not aelema
+      
+      -- TS 54
+      -- Small class, just list all members
+      ("tule"|"sure"|"pane") + "ma" =>
+        cTulema lugema ;
+        
+      -- TS 55-57
+      -- Consonant gradation
+      -- Regular (55-56)'leppima' and irregular (57) 'lugema'
+      -- For reliable results regarding consonant gradation, use mk3V
+      _ + "ndima" =>
+        cLeppima lugema ;
+      _ + #lmnr + ("k"|"p"|"t"|"b") + ("ima"|"uma") => 
+        cLeppima lugema ;
+      _ + ("sk"|"ps"|"ks"|"ts"|"pl") + ("ima") => --|"uma") => 
+        cLeppima lugema ;
+      _ + ("hk"|"hm"|"hn"|"hr"|"ht") + ("ima") => --most *hCuma are TS 51 (muutuma) 
+        cLeppima lugema ;
+      _ + #c + "ssima" => --weaker *ss = *ss; should be weaker Css = Cs
+        cLugema lugema ;
+      _ + ("pp"|"kk"|"tt"|"ss"|"ff"|"nn"|"mm"|"ll"|"rr") + ("ima"|"uma") => 
+        cLeppima lugema ;
+      
+      -- TS 59 (petma, tapma) 
+      -- Use mk4V for TS 60 (jätma, võtma)
+      ? + #v + ("tma"|"pma") =>
+        cPetma lugema (luge + "etakse") ;
+      -- TS 58 for rest that end tma (muutma,kartma,...)
+      _ + "tma" =>
+        cMuutma lugema ;
+
+     -- TS 61 (laulma,kuulma,naerma,möönma)
+     -- Default vowel e for lma, a for (r|n)ma.
+     -- Other vowel with mk3V.
+      _ + "lma" => 
+        cKuulma lugema (loe + "eb") ; 
+      _ + ("r"|"n") + "ma" =>
+        cKuulma lugema (loe + "ab") ;
+     
+      -- TS 63 (andma,hoidma)
+      -- Other vowel than a (tundma~tunneb) with mk3V
+      _ + "dma" =>
+        cAndma lugema (loe + "ab") ;
+             
+      -- TS 62, 64 (tõusma,mõskma), default vowel e
+      -- 62 alt form (jooksma,joosta) with mk2V
+      -- Other vowel than e with mk3V
+      _ + #c + "ma" => 
+        cLaskma lugema (loe + "eb") ;
+        
+      -- TS 65 (pesema)
+      #c + #v + "sema" =>
+        cPesema lugema ;
+        
+      -- TS 66 (nägema)
+      -- Small class, just list all members
+      ("nägema"|"tegema") =>
+        cNagema lugema ;
+      
+      -- TS 67-68 with mk2V
+      -- no 100% way to distinguish from 50-52 that end in ama
+
+      -- TS 69
+      -- one to three characters before "tlema"
+      (?|"") + (?|"") + ? + "tlema" => --vestlema,mõtlema,ütlema; not õnnitlema
+        cOmblema lugema ;
+      _ + "tlema" =>
+        cElama lugema ;
+      _ + #c + "lema" =>
+        cOmblema lugema ;
+
+      -- TS 50-52
+      -- Default case
+      _ =>
+        cElama lugema
+    } ;   
+
+  -- Two-form verb heuristic: the da-infinitive is used to detect classes
+  -- that the ma-infinitive alone cannot identify. Patterns are tried from
+  -- top to bottom; the default delegates to vForms1.
+  vForms2 : (_,_ : Str) -> VForms = \petma,petta ->
+    -- Arguments: ma infinitive, da infinitive
+    -- Use this for the following cases:
+    -- * 62 alt form (Csma, sta)
+    -- * 50-52 (elama) recognized as 69 (õmblema)
+    -- * 66 (nägema~näha)
+    -- * 54 (tulema~tulla)
+    -- * 67-68 (hüppama~hüpata)
+    case <petma,petta> of {
+      <_ + "ksma", _ + "sta"> => cJooksma petma ; --62 alt forms
+      <_,          _ + "ata"> => cHyppama petma ; --67-68
+      <_,          _ + "ha"> => cNagema petma ; --66
+      <_,          _ + ("rra"|"lla"|"nna")> => cTulema petma ; --54
+      <_ + #c + "lema",
+       _ + #c + "leda"> => cElama petma ; --50-52 (õnnitlema) recognized as 69 (mõtlema)
+       _ => vForms1 petma
+      } ;
+
+  -- Three-form verb heuristic: the b-form fixes the stem vowel and the
+  -- gradation. Patterns are tried from top to bottom; the default ignores
+  -- the b-form and delegates to vForms2.
+  vForms3 : (_,_,_ : Str) -> VForms = \taguma,taguda,taob ->
+    -- Arguments: ma infinitive, da infinitive, b
+    -- Use this for the following cases:
+    -- * Irregular gradation (taguma~taob)
+    -- * Non-detectable gradation (sattuma~satub ; pettuma~pettub)
+    -- * Non-default vowel in b for TS 58-64 (laulma~laulab)
+    case <taguma,taguda,taob> of {
+    
+      --to be sure about vowel in b
+      <_ + "dma", _ + "da", _> => cAndma taguma taob ;
+      <_, _ + #vv + #lmnr + "da", _> => cKuulma taguma taob ;
+      <_, _ + #c + "ta", _> => cLaskma taguma taob ; 
+
+      --irregular gradation
+      <_, _, (""|#c) + #c + #v + #v + "b"> => cLugema taguma ; --57
+
+      --to be sure about consonant gradation
+      <_ + #c + "lema", _, _> => vForms2 taguma taguda ; --catch "-Clema" first
+      <_ + #v + "ma", _+"da", _> => cSattumaPettuma taguma taob ; 
+
+      <_,_,_> => vForms2 taguma taguda      
+    } ;
+    
+  -- Four-form verb heuristic. Arguments: ma-infinitive, da-infinitive,
+  -- b-form and takse-form. Known irregular shapes are routed to their class
+  -- constructors first; everything else goes to regVForms with all four forms.
+  vForms4 : (x1,_,_,x4 : Str) -> VForms = \jatma,jatta,jatab,jaetakse ->
+    -- 4 forms needed to get full paradigm for regular verbs
+    -- (source: http://www.eki.ee/books/ekk09/index.php?p=3&p1=5&id=227)
+    -- regVForms in MorphoEst handles majority of these.
+    -- Filter out known irregularities and give rest to regVForms.
+    -- Not trying to match TS 49 ; can't separate käima (49) from täima (50), or detect compounds like taaslooma.
+    case <jatma,jatta,jatab,jaetakse> of {
+      <_,          _+("kka"|"ppa"|"tta"), 
+       _,          _+"takse"> => cPetma jatma jaetakse ;
+      <_ + "dma",  _,
+       _,          _+"takse"> => cAndma jatma jatab ;
+      <_ + ("ts"|"ks"|"sk") + "ma", _,_,_> => cLaskma jatma jatab ;
+      <_, _ + ("lla"|"nna"|"rra"), _, _> => cTulema jatma ;
+      <_, _ + "ha", _, _> => cNagema jatma ;
+      <_ + #v + "sema", _ + "sta", _, _> => cPesema jatma ;
+      <_,_,_,_> => regVForms jatma jatta jatab jaetakse
+    } ;    
+    
+  -- Same verb with a different subject case.
+  caseV = \cas,verb ->
+    {s = verb.s ; p = verb.p ; sc = NPCase cas ; lock_V = <>} ;
+
+  -- The two special verbs, both with a nominative subject.
+  vOlema  = verbOlema  ** {sc = NPCase Nom ; lock_V = <>} ;
+  vMinema = verbMinema ** {sc = NPCase Nom ; lock_V = <>} ;
+
+  -- Two-place verbs: explicit Prep, bare case, or direct object (accPrep).
+  mk2V2 : V -> Prep -> V2 = \verb,compl ->
+    verb ** {c2 = compl ; lock_V2 = <>} ;
+  caseV2 : V -> Case -> V2 = \verb,cas ->
+    mk2V2 verb (casePrep cas) ;
+  dirV2 = \verb -> mk2V2 verb accPrep ;
+
+  -- Adverbs: from a plain string or from a dictionary entry.
+  mkAdv = overload {
+    mkAdv : Str -> Adv = \str ->
+      {s = str ; lock_Adv = <>} ;
+    mkAdv : AdvW -> Adv = \entry ->
+      {s = entry.s ; lock_Adv = <>} ;
+    } ;
+
+  -- Two-place verb constructor; the string variant builds the verb with the
+  -- one-argument heuristic and gives it a direct object.
+  mkV2 = overload {
+    mkV2 : Str -> V2 = \ma -> dirV2 (mk1V ma) ;
+    mkV2 : V -> V2 = dirV2 ;
+    mkV2 : V -> Case -> V2 = caseV2 ;
+    mkV2 : V -> Prep -> V2 = mk2V2 ;
+    } ;
+
+  -- Type signatures of the workers used above.
+  dirV2  : V -> V2 ;
+  caseV2 : V -> Case -> V2 ;
+  mk2V2  : V -> Prep -> V2 ;
+
+  -- Three-place verbs: two complement markers; dirV3 takes a direct object
+  -- plus a bare case, dirdirV3 a direct object plus an allative.
+  mkV3 = \verb,compl2,compl3 ->
+    verb ** {c2 = compl2 ; c3 = compl3 ; lock_V3 = <>} ;
+  dirV3 = \verb,cas -> mkV3 verb accPrep (casePrep cas) ;
+  dirdirV3 = \verb -> dirV3 verb allative ;
+
+  -- Sentence-, verb- and question-complement verbs. mkVV uses the
+  -- da-infinitive for the complement.
+  mkVS = \verb -> verb ** {lock_VS = <>} ;
+  mkVV = \verb -> mkVVf verb infDa ;
+  mkVVf = \verb,form -> verb ** {vi = form ; lock_VV = <>} ;
+  mkVQ = \verb -> verb ** {lock_VQ = <>} ;
+
+  -- Categories that are synonyms of V, A or A2.
+  V0 : Type = V ;
+  AS, A2S, AV : Type = A ;
+  A2V : Type = A2 ;
+
+  mkV0 = \verb -> verb ** {lock_V = <>} ;
+  mkV2S = \verb,compl -> mk2V2 verb compl ** {lock_V2S = <>} ;
+  -- mkV2V uses the ma-infinitive for the verbal complement.
+  mkV2V = \verb,compl -> mkV2Vf verb compl infMa ;
+  mkV2Vf = \verb,compl,form -> mk2V2 verb compl ** {vi = form ; lock_V2V = <>} ;
+
+  mkVA = \verb,compl -> verb ** {c2 = compl ; lock_VA = <>} ;
+  mkV2A = \verb,compl2,compl3 ->
+    verb ** {c2 = compl2 ; c3 = compl3 ; lock_V2A = <>} ;
+  mkV2Q = \verb,compl -> mk2V2 verb compl ** {lock_V2Q = <>} ;
+
+  -- Adjective complement patterns.
+  mkAS = \adj -> adj ** {lock_A = <>} ;
+  mkA2S = \adj,compl -> mkA2 adj compl ** {lock_A = <>} ;
+  mkAV = \adj -> adj ** {lock_A = <>} ;
+  mkA2V = \adj,compl -> mkA2 adj compl ** {lock_A2 = <>} ;
+
+} ;