From 22de842e37a8136a8c556bdbe6bab4180d62a240 Mon Sep 17 00:00:00 2001 From: Julia Jansson Date: Thu, 30 Apr 2020 17:24:46 +0200 Subject: [PATCH 1/3] Documentation --- src/hungarian/LexiconHun.gf | 2 +- src/hungarian/NounMorphoHun.gf | 5 +++-- src/hungarian/README.md | 9 ++++++++- 3 files changed, 12 insertions(+), 4 deletions(-) diff --git a/src/hungarian/LexiconHun.gf b/src/hungarian/LexiconHun.gf index deda0643c..2de054a31 100644 --- a/src/hungarian/LexiconHun.gf +++ b/src/hungarian/LexiconHun.gf @@ -140,7 +140,7 @@ lin forest_N = mkN "erdő" "erdőt" ; -- lin freeze_V = mkV "" ; lin fridge_N = mkN "hűtő" "hűtőt" ; lin friend_N = mkN "barát" "barátot" ; -lin fruit_N = mkN "gyümölcs" "gyümölcsöt" "gyümölcsök" "gyümölcse" ; +lin fruit_N = mkN "gyümölcs" "gyümölcsöt" "gyümölcsök" "gyümölcse" ; --TODO: plural PossPl2 fails "gyümölcseitek" instead of "gyümölcseitök", vowel harmony changing? lin full_A = mkA "tele" ; -- --lin fun_AV diff --git a/src/hungarian/NounMorphoHun.gf b/src/hungarian/NounMorphoHun.gf index 5b08fb429..b5056d651 100644 --- a/src/hungarian/NounMorphoHun.gf +++ b/src/hungarian/NounMorphoHun.gf @@ -184,7 +184,7 @@ oper -- orr, orr|ot -> orr|a -- TODO fails for gyümölcs, gyümölcs|öt -> gyümölcs|e - -- I don't know what this list means /IL + -- This list could maybe be deleted _ + #v + ("sz"|"z"|"s"|"zs"|"j"|"ly"|"l"|"r"|"n"|"ny" |"ssz"|"zz"|"ss"|"ll"|"rr"|"nn"|"ns"|"nsz"|"nz") + ("o"|"ö") => init tolla ; @@ -242,7 +242,8 @@ oper -- More words not covered by current paradigms: -- https://cl.lingfil.uu.se/~bea/publ/megyesi-hungarian.pdf - -- TODO: teher ~ terhet (consonant-crossing) + -- TODO: teher ~ terhet (consonant-crossing) works in all cases except ParamHun.PossdSg_PossrPl1 + -- Worst case constructor: takes all stems worstCaseNoun : (x1,_,_,_,_,_,_,x8 : Str) -> Harm -> Noun = diff --git a/src/hungarian/README.md b/src/hungarian/README.md index f9857d1e5..2a1775a46 100644 --- a/src/hungarian/README.md +++ b/src/hungarian/README.md @@ -8,7 +8,7 @@ 
## Authors -Inari Listenmaa, Julia Jansson, 2020- +Inari Listenmaa, Julia Jansson, 2020-04 With contributions from Erzsébet Galgóczy (initial nominal morphology) and Patrik Jansson (numerals). @@ -20,6 +20,13 @@ With contributions from Erzsébet Galgóczy (initial nominal morphology) and Pat So far (2020-03) just copypasted a dummy module with Hungarian words that inflect mostly wrong or not at all. This will change in a few weeks. +(2020-04) +A basic RGL exists with focus on noun inflection in NounMorphoHun.gf. First the implementation of NounMorphoHun.gf was in paradigms taking one argument (nominative) with different cases for plural, accusative and superessive cases. NounMorphoHun.gf also includes vowels, consonants and double/triple consonants, and functions using vowel harmony for the different stems. Since the accusative has proven to be irregular, the structure was changed to multi-argument paradigms taking nominative and accusative; as a result the paradigms could be simplified considerably, and they yield correct results to a higher degree. For cases when only nominative is entered as an argument there is a function that guesses accusative from nominative, but it is better to use several arguments. + +Later, possessive stem inflection was implemented, which was quite complicated. Some paradigms take possessive forms as arguments; others have rules where using the accusative was enough. However, the irregularity in possessive forms showed that several possessive arguments may be necessary for yielding correct results. Special cases are noted in NounMorphoHun.gf and LexiconHun.gf. For all these to work, some more work on vowel harmony and the paradigms needs to be done. Furthermore, not all 21 cases are implemented in NounMorphoHun.gf; it is missing the cases Essive, Temporal, Formal and Terminative. + +TL;DR: a basic noun inflection structure covering most cases and possessive suffixes is implemented. 
There are special cases that need to be fixed, and there is work left on vowel harmony and on adding the missing cases. + ## Maintainer From edf7f60a5fadb760dcaf6566e3f4a9069f73cbad Mon Sep 17 00:00:00 2001 From: Julia Jansson Date: Thu, 30 Apr 2020 17:31:35 +0200 Subject: [PATCH 2/3] Update README.md --- src/hungarian/README.md | 7 ++----- 1 file changed, 2 insertions(+), 5 deletions(-) diff --git a/src/hungarian/README.md b/src/hungarian/README.md index 2a1775a46..c87203ff4 100644 --- a/src/hungarian/README.md +++ b/src/hungarian/README.md @@ -8,7 +8,7 @@ ## Authors -Inari Listenmaa, Julia Jansson, 2020-04 +Inari Listenmaa, Julia Jansson, 2020- With contributions from Erzsébet Galgóczy (initial nominal morphology) and Patrik Jansson (numerals). @@ -17,10 +17,7 @@ With contributions from Erzsébet Galgóczy (initial nominal morphology) and Pat - ## Implementation information - -So far (2020-03) just copypasted a dummy module with Hungarian words that inflect mostly wrong or not at all. This will change in a few weeks. - -(2020-04) +(2020-04) - Julia Jansson A basic RGL exists with focus on noun inflection in NounMorphoHun.gf. First the implementation of NounMorphoHun.gf was in paradigms taking one argument (nominative) with different cases for plural, accusative and superessive cases. NounMorphoHun.gf also includes vowels, consonants and double/triple consonants, and functions using vowel harmony for the different stems. Since the accusative has proven to be irregular, the structure was changed to multi-argument paradigms taking nominative and accusative; as a result the paradigms could be simplified considerably, and they yield correct results to a higher degree. For cases when only nominative is entered as an argument there is a function that guesses accusative from nominative, but it is better to use several arguments. Later, possessive stem inflection was implemented, which was quite complicated. 
Some paradigms take possessive forms as arguments; others have rules where using the accusative was enough. However, the irregularity in possessive forms showed that several possessive arguments may be necessary for yielding correct results. Special cases are noted in NounMorphoHun.gf and LexiconHun.gf. For all these to work, some more work on vowel harmony and the paradigms needs to be done. Furthermore, not all 21 cases are implemented in NounMorphoHun.gf; it is missing the cases Essive, Temporal, Formal and Terminative. From 52d475e0409e244cd2834a5d5d93665a3685be23 Mon Sep 17 00:00:00 2001 From: Julia Jansson Date: Thu, 30 Apr 2020 17:31:52 +0200 Subject: [PATCH 3/3] Update README.md --- src/hungarian/README.md | 1 + 1 file changed, 1 insertion(+) diff --git a/src/hungarian/README.md b/src/hungarian/README.md index c87203ff4..6328829ad 100644 --- a/src/hungarian/README.md +++ b/src/hungarian/README.md @@ -18,6 +18,7 @@ With contributions from Erzsébet Galgóczy (initial nominal morphology) and Pat ## Implementation information (2020-04) - Julia Jansson + A basic RGL exists with focus on noun inflection in NounMorphoHun.gf. First the implementation of NounMorphoHun.gf was in paradigms taking one argument (nominative) with different cases for plural, accusative and superessive cases. NounMorphoHun.gf also includes vowels, consonants and double/triple consonants, and functions using vowel harmony for the different stems. Since the accusative has proven to be irregular, the structure was changed to multi-argument paradigms taking nominative and accusative; as a result the paradigms could be simplified considerably, and they yield correct results to a higher degree. For cases when only nominative is entered as an argument there is a function that guesses accusative from nominative, but it is better to use several arguments. Later, possessive stem inflection was implemented, which was quite complicated. 
Some paradigms take possessive forms as arguments; others have rules where using the accusative was enough. However, the irregularity in possessive forms showed that several possessive arguments may be necessary for yielding correct results. Special cases are noted in NounMorphoHun.gf and LexiconHun.gf. For all these to work, some more work on vowel harmony and the paradigms needs to be done. Furthermore, not all 21 cases are implemented in NounMorphoHun.gf; it is missing the cases Essive, Temporal, Formal and Terminative.