catalan_smart_paradigms

MorphoCat and ParadigmsCat: smart paradigms for adjectives. 
ExtraCat: added construction for negative imperative.
This commit is contained in:
inari.listenmaa
2012-10-19 09:36:37 +00:00
parent e666fa838f
commit 606f8bece8
4 changed files with 202 additions and 67 deletions

View File

@@ -28,31 +28,31 @@ oper
nomCasa : Str -> Str -> Number => Str = \es,casa ->
numForms casa (init casa + es) ;
numForms casa (init casa + es) ;
nomFre : Str -> Number => Str = \fre ->
numForms fre (fre + "ns") ;
numForms fre (fre + "ns") ;
nomCas : Str -> Number => Str = \cas ->
numForms cas (cas + "os") ;
numForms cas (cas + "os") ;
nomTest : Str -> Number => Str = \test ->
numForms test (variants {test + "s"; test + "os"}) ;
numForms test (variants {test + "s"; test + "os"}) ;
nomFaig : Str -> Number => Str = \faig ->
let
fa = Predef.tk 2 faig
in
numForms faig (variants {fa + "jos" ; faig + "s"}) ;
let
fa = Predef.tk 2 faig
in
numForms faig (variants {fa + "jos" ; faig + "s"}) ;
nomDesig : Str -> Number => Str = \desig ->
let
desi = Predef.tk 1 desig
in
numForms desig (variants {desi + "tjos" ; desi + "gs"}) ;
let
desi = Predef.tk 1 desig
in
numForms desig (variants {desi + "tjos" ; desi + "gs"}) ;
nomTemps : Str -> Number => Str = \temps ->
numForms temps temps ;
numForms temps temps ;
-- Common nouns are inflected in number and have an inherent gender.
@@ -63,18 +63,18 @@ oper
mkNoun (numForms vi vins) ;
mkNomReg : Str -> Noun = \noi ->
let
mkNounMas : (Str -> Number => Str) -> Noun = \rule -> mkNoun (rule noi) Masc
in
let
mkNounMas : (Str -> Number => Str) -> Noun = \rule -> mkNoun (rule noi) Masc
in
case last noi of {
"a" => mkNoun (nomCasa "es" noi) Fem ;
"s"|"x"|"ç" => mkNounMas nomCas ;
"i" => mkNounMas nomFre ;
"í" => mkNounMas (nomCasa "ins") ;
"à" => mkNounMas (nomCasa "ans") ;
"ó" => mkNounMas (nomCasa "ons") ;
"g" => mkNounMas nomFaig ;
_ => mkNounMas nomCep
"a" => mkNoun (nomCasa "es" noi) Fem ;
"s"|"x"|"ç" => mkNounMas nomCas ;
"i" => mkNounMas nomFre ;
"í" => mkNounMas (nomCasa "ins") ;
"à" => mkNounMas (nomCasa "ans") ;
"ó" => mkNounMas (nomCasa "ons") ;
"g" => mkNounMas nomFaig ;
_ => mkNounMas nomCep
} ;
--2 Adjectives
@@ -97,33 +97,155 @@ oper
mkAdj prim (prim + "a") (prim + "s") (prim + "es") (prim + "ament") ;
adjBlau : Str -> Str -> Adj = \blau,blava ->
let
blav = Predef.tk 1 blava
in
mkAdj blau blava (blau + "s") (blav + "es") (blava + "ment") ;
let blav = Predef.tk 1 blava
in mkAdj blau blava (blau + "s") (blav + "es")
(blava + "ment") ;
adjFondo : Str -> Adj = \fondo ->
let
fond = Predef.tk 1 fondo
in
adjBlau fondo (fond + "a") ;
let fond = Predef.tk 1 fondo
in adjBlau fondo (fond + "a") ;
adjBo : Str -> Adj = \bo ->
mkAdj bo (bo + "na") (bo + "ns") (bo + "nes") (bo + "nament") ;
mkAdj bo (bo + "na") (bo + "ns") (bo + "nes") (bo + "nament") ;
adjFidel : Str -> Adj = \fidel ->
let
fidels = fidel + "s"
in
mkAdj fidel fidel fidels fidels (fidel + "ment") ;
let fidels : Str = case (last fidel) of {
_ + ("s"|"ç"|"x") => fidel + "os" ; --feliç; capaç
_ => fidel + "s"
} ;
in mkAdj fidel fidel fidels fidels
(fidel + "ment") ;
-- Adjectives in -ig, built from the masculine and feminine singular.
--   boig  boja   bojos   boges
--   lleig lletja lletjos lletges
-- The feminine plural drops the final "j" of the feminine stem and takes
-- "ges"; every other non-masculine-singular form is built on the stem with "j".
adjIg : Str -> Str -> Adj = \boig,boja ->
  let femStem : Str = init boja ;       -- "boj", "lletj"
      bareStem : Str = init femStem     -- "bo", "llet"
  in mkAdj boig
       (femStem + "a")
       (femStem + "os")
       (bareStem + "ges")
       (femStem + "ament") ;
-- Adjectives ending in "c" or "g" that keep the consonant in the feminine
-- singular and respell it as "qu" / "gu" before the feminine plural "es".
--   públic pública públics públiques
--   llarg  llarga  llargs  llargues
-- Only a final "c" or "g" is handled here (llarg, not boig).
adjXc : Str -> Adj = \blanc ->
  let stem : Str = init blanc ;
      hardStem : Str = case last blanc of {
        "g" => stem + "gu" ;
        "c" => stem + "qu"
      }
  in mkAdj blanc
       (blanc + "a")
       (blanc + "s")
       (hardStem + "es")
       (blanc + "ament") ;
-- Sibilant endings: both plurals and the adverb are built on the feminine
-- singular minus its last letter; the two singular forms are passed through.
--   divers diversa diversos diverses
--   rus    russa   russos   russes
adjXs : Str -> Str -> Adj = \famos,famosa ->
  let stem : Str = init famosa
  in mkAdj famos famosa (stem + "os") (stem + "es") (stem + "ament") ;
-- Adjectives ending in an accented vowel: every form except the masculine
-- singular is built on the word with its last vowel unaccented plus "n".
--   català catalana catalans catalanes
adjVn : Str -> Adj = \catalA ->
  let nStem : Str = init catalA + unaccent (last catalA) + "n"
  in mkAdj catalA
       (nStem + "a")
       (nStem + "s")
       (nStem + "es")
       (nStem + "ament") ;
-- Adjectives whose final "t" / "c" becomes "d" / "g" in the feminine.
--   casat casada casats casades
--   groc  groga  grocs  grogues
-- Only a final "t" or "c" is handled. When the feminine consonant is "g",
-- the feminine plural inserts "u" before "es".
adjCasat : Str -> Adj = \casat ->
  let stem : Str = init casat ;
      voiced : Str = case last casat of {
        "t" => "d" ;
        "c" => "g"
      } ;
      femStem : Str = stem + voiced ;
      femPlStem : Str = case voiced of {
        "g" => femStem + "u" ;
        _ => femStem
      }
  in mkAdj casat
       (femStem + "a")
       (casat + "s")
       (femPlStem + "es")
       (femStem + "ament") ;
-- Adjectives ending in an accented vowel followed by one more letter
-- (mkAdjReg sends words in accented vowel + "s" here): the accent on the
-- second-to-last letter is removed and the stem is closed with "s".
--   francès francesa francesos franceses
adjFrances : Str -> Adj = \francEs ->
  let plainVowel : Str = unaccent (last (init francEs)) ;
      stem : Str = tk 2 francEs + plainVowel + "s"
  in mkAdj francEs
       (stem + "a")
       (stem + "os")
       (stem + "es")
       (stem + "ament") ;
-- Adjectives like "europeu": the last letter is dropped for the feminine
-- forms and the adverb, and kept for the masculine plural.
--   europeu europea europeus europees
adjEuropeu : Str -> Adj = \europeu ->
  let stem : Str = init europeu
  in mkAdj europeu
       (stem + "a")
       (europeu + "s")
       (stem + "es")
       (stem + "ament") ;
-- Invariable adjectives in -a: one form serves both genders in the singular,
-- and both genders share a plural in "es".
--   belga    belga    belgues   belgues
--   inca     inca     inques    inques
--   agrícola agrícola agrícoles agrícoles
-- Before the plural "es" a stem-final "g" is respelled "gu" and a stem-final
-- "c" is respelled "qu" (the same c ~ qu change adjXc makes); appending "u"
-- to "c" would give the wrong spelling "-cues".
adjBelga : Str -> Adj = \belga ->
  let belg : Str = init belga ;
      belgu : Str = case last belg of {
        "g" => belg + "u" ;           -- belga ~ belgues
        "c" => init belg + "qu" ;     -- inca ~ inques
        _ => belg                     -- agrícola ~ agrícoles
      } ;
      belgues : Str = belgu + "es"
  in mkAdj belga belga belgues belgues (belga + "ment") ;
mkAdjReg : Str -> Adj = \prim ->
case prim of {
-- _ + "e" + ("r"|"l") => adjPrim prim ;
_ + "l" => adjFidel prim ;
_ + ("e"|"u"|"o") => adjFondo prim ;
_ => adjPrim prim
} ;
case prim of {
_ + "ll" => adjPrim prim ; --vell~vella
_ + "rn" => adjPrim prim ; --modern~moderna
_ + ("l"|"n"|"ç") => adjFidel prim ; --local; gran; capaç. For espanyol~espanyola mk2A.
_ + "a" => adjBelga prim ; --invariable, -es in plural
_ + ("eu") => adjFidel prim ; --greu; breu. most "eu" are invariable, europeu and jueu with mk2A.
_ + ("au"|"ou"|"iu") => adjBlau prim (tk 1 prim + "va"); --blau; nou; viu
_ + ("e"|"o") => adjFondo prim ;
_ + "ig" => adjIg prim (tk 2 prim + "ja") ; --boig~boja. lleig~lletja with mk2A.
_ + ("c"|"g") => adjXc prim ; --públic; llarg. cec~cega with mk2A
_ + ("n"|"l"|"r"|"s") + "t" => adjPrim prim ; --mort,llest,distint
_ + "t" => adjCasat prim ; --tancat~tancada. petit~petita with mk2A.
_ + ("à"|"é"|"è"|"í"|"ó"|"ò"|"ú") => adjVn prim ; --comú~comuna
_ + ("à"|"é"|"è"|"í"|"ó"|"ò"|"ú") + "s" => adjFrances prim ;
_ + ("s"|"x") => adjXs prim (prim + "a") ; --divers~diversa
_ => adjPrim prim
} ;
--Used for the following:
--diferent diferent : doesn't end in l/n/ç/eu but has invariant feminine
--petit petita petits petites : voiceless plosive in the stem.
--ridícul ridícula : ends in l/n/ç but is not invariant.
--lleig lletja : the geminated variant of boig boja
--bo bona ; pla plana : like adjVn, but for one syllable words
--diari diària ; ingenu ingènua : in feminine, stress in antepenultimate
--jueu jueva ; europeu europea : exceptional paradigms for "eu" ending
--rus russa : voiceless s in the stem
--groc groga : voiced g in the stem
-- Two-argument smart paradigm: chooses an adjective paradigm from the
-- masculine singular (petit) and the feminine singular (petita).
-- The branches are tried from top to bottom, so an earlier pair of endings
-- takes precedence over a later one; a pair that matches no branch falls
-- back to the one-argument mkAdjReg applied to the masculine form.
-- NOTE(review): the second branch binds p and then uses p+"a" in the other
-- component; confirm whether GF reads this as "feminine = masculine + a" or
-- as a fresh binding of p.
mkAdj2Reg : Str -> Str -> Adj = \petit,petita ->
case <petit,petita> of {
<_, _ + ("b"|"c"|"d"|"e"|"f"|"g"|"h"|"i"|"j"|"k"|"l"|"m"|"n"|"o"|"p"|"q"|"r"|"s"|"t"|"u"|"v"|"x"|"y"|"z")> => adjFidel petit ; --feminine doesn't end in "a"
<p@(_ + ("t"|"l"|"ç")), p+"a"> => adjPrim petit ; --1) petit~petita 2) ridícul~ridícula, dolç~dolça
<_ + "ig", _> => adjIg petit petita ; --lleig~lletja
<_, _+ "na"> => adjVn petit ; --pla~plana
<_, _ + ("à"|"é"|"è"|"í"|"ó"|"ò"|"ú") + _> => adjBlau petit petita ; --diari~diària
<_ + "u" , _ + "va"> => adjBlau petit petita ; --jueu~jueva
<_ + "eu", _ + "ea"> => adjEuropeu petit ; --europeu~europea
<_ + "s" , _> => adjXs petit petita ; --rus~russa
<_ + "c" , _ + "ga"> => adjCasat petit ; --groc~groga
_ => mkAdjReg petit
} ;
-- Maps a single accented vowel to its plain counterpart; any other string
-- is returned unchanged.
oper unaccent : Str -> Str = \vocal ->
  case vocal of {
    "à" => "a" ;
    "è"|"é" => "e" ;
    "í" => "i" ;
    "ò"|"ó" => "o" ;
    "ú" => "u" ;
    _ => vocal
  } ;
--2 Personal pronouns
@@ -146,7 +268,7 @@ oper
poss = \\n,g => case <n,g> of {
<Sg,Masc> => son ;
<Sg,Fem> => sa ;
<Pl,Masc> => elsSeus ;
<Pl,Masc> => elsSeus ;
<Pl,Fem> => lesSeves
} ;
a = Ag g n p ;