final version of kotus experiment

This commit is contained in:
aarne
2008-02-18 18:20:42 +00:00
parent 389ba6058d
commit 4e3d240d2d
5 changed files with 1350 additions and 1152 deletions

View File

@@ -112,6 +112,13 @@
PUBLISHER = {{Springer-Verlag}}
}
@book{CopestakeLKB,
AUTHOR = {A. Copestake},
TITLE = {{Implementing Typed Feature Structure Grammars}},
YEAR = {2002},
PUBLISHER = {{CSLI Publications}}
}
@book{stroustrup,
AUTHOR = {B. Stroustrup},
TITLE = {{The C++ Programming Language, Third Edition}},
@@ -287,6 +294,30 @@
year = {2002}
}
@InProceedings{saghein-1978,
author = "Anna {S\aa gvall Hein}",
title = {{Finnish Morphological Analysis in the Reversible Grammar System}},
booktitle = {{COLING 78, Information Abstracts}},
year = {1978}
}
@ARTICLE{saghein-1980,
AUTHOR = "Anna {S\aa gvall Hein}",
TITLE = "An Outline of a Computer Model of Finnish Word Recognition",
JOURNAL = {{Fenno-Ugrica Suecana}},
VOLUME = {3},
PAGES = {7--26},
YEAR = {1980} }
@ARTICLE{koskenniemi-1980,
AUTHOR = "Kimmo Koskenniemi",
TITLE = "On Automatic Lemmatization of Finnish",
JOURNAL = {{Fenno-Ugrica Suecana}},
VOLUME = {3},
PAGES = {27--44},
YEAR = {1980} }
@book{martin-lof,
AUTHOR = {P. Martin-L\"{o}f},
TITLE = {{Intuitionistic Type Theory}},
@@ -512,6 +543,15 @@
year = 2001
}
@inproceedings{carlson-2005,
title = {{Inducing a Morphological Transducer from Inflectional Paradigms}},
author = {Lauri Carlson},
booktitle = {{Inquiries into Words, Constraints and Contexts.
Festschrift for Kimmo Koskenniemi on his 60th Birthday}},
publisher = {{CSLI}},
year = 2005
}
@BOOK{dowty,
AUTHOR = "Dowty, D",
TITLE = "Word Meaning and Montague Grammar",
@@ -856,6 +896,17 @@
pages = {607--639}
}
@inproceedings{TomitaCarbobell,
author = {Masaru Tomita and
Jaime G. Carbonell},
title = {The Universal Parser Architecture for Knowledge-based Machine
Translation},
booktitle = {IJCAI},
year = {1987},
pages = {718--721},
bibsource = {DBLP, http://dblp.uni-trier.de}
}
@InProceedings{luocall,
author = {Z. Luo and P. Callaghan},
@@ -1023,14 +1074,61 @@
volume={14(2)},
YEAR = {2004} }
@ARTICLE{huet-2005,
AUTHOR = "G{\'e}rard Huet",
TITLE = {{A Functional Toolkit for Morphological and Phonological Processing, Application to a Sanskrit Tagger}},
JOURNAL = {{The Journal of Functional Programming}},
pages={573--614},
volume={15(4)},
YEAR = {2005} }
@InProceedings{extract-2006,
AUTHOR = "M. Forsberg and H. Hammarstr{\"o}m and A. Ranta",
TITLE = {{Morphological Lexicon Extraction from Raw Text Data}},
booktitle = {{FinTAL 2006}},
year = {{2006}},
series = {{LNCS/LNAI}},
volume = {4139},
editor = {T. Salakoski}
}
@misc{minnen95offline,
author = "G. Minnen and D. Gerdemann and T. Gotz",
title = "Off-line optimization for {E}arley-style {HPSG} processing",
text = "G. Minnen, D. Gerdemann, and T. Gotz. Off-line optimization for Earley-style
HPSG processing. In Proc. of the 7th Conference of the EACL, Dublin, 1995.",
year = "1995",
url = "citeseer.ist.psu.edu/article/minnen95offline.html" }
@Misc{Happy-GLR,
author = {P. Callaghan and B. Medlock},
title = {{Happy-GLR}},
note = {\verb6http://www.dur.ac.uk/p.c.callaghan/happy-glr/6},
year = 2004
}
@Misc{XLE-homepage,
author = {R. Kaplan and J. Maxwell},
title = {{XLE Project Homepage}},
note = {\verb6http://www2.parc.com/isl/groups/nltt/xle/6},
year = 2007
}
@Misc{GF-homepage,
author = {A. Ranta},
title = {{Grammatical Framework Homepage}},
note = {\verb6www.cs.chalmers.se/~aarne/GF/6},
url = "http://www.cs.chalmers.se/~aarne/GF/",
year = 2002
note = {\verb6digitalgrammars.com/gf6},
url = "digitalgrammars.com/gf",
year = 2008
}
@Misc{kotus-wordlist,
author = "{Kotimaisten Kielten Tutkimuskeskus}",
title = {{KOTUS Wordlist}},
note = {\verb6kaino.kotus.fi/sanat/nykysuomi6},
year = 2006
}
@Misc{happy,
@@ -1050,6 +1148,27 @@
YEAR = {1994}
}
@Book{nssk,
editor = {M. Sadeniemi},
title = {{Nykysuomen sanakirja}},
publisher = {{WSOY}},
year = {1961}
}
@Book{hellberg,
author = {S. Hellberg},
title = {{The Morphology of Present-Day Swedish}},
publisher = {{Almqvist \& Wiksell}},
year = {1978}
}
@Book{karlsson-1977,
author = {F. Karlsson},
title = {{Finsk grammatik}},
publisher = {{Suomalaisen Kirjallisuuden Seura}},
year = {1977}
}
@Book{Ranta94,
author = {A. Ranta},
title = {{Type Theoretical Grammar}},
@@ -1072,6 +1191,14 @@
year = 1998
}
@InProceedings{brodda-karlsson,
author = {B. Brodda and F. Karlsson},
title = {{An Experiment with Automatic Morphological Analysis of Finnish}},
series = {{Papers from the Institute of Linguistics, University of Stockholm}},
volume = 40,
year = 1978
}
@PhdThesis{fiedler,
@@ -1081,6 +1208,14 @@
year = 2001
}
@PhdThesis{koskenniemi-1983,
author = {Kimmo Koskenniemi},
title = {{Two-Level Morphology: A General Computational Model for
Word-Form Recognition and Production}},
school = {{University of Helsinki}},
year = 1983
}
@PhdThesis{peb,
author = {P. Ljungl\"of},
title = {{The Expressivity and Complexity of Grammatical Framework}},
@@ -1090,6 +1225,16 @@
year = {2004}
}
@PhdThesis{forsberg-2007,
author = {Markus Forsberg},
title = {{Three Tools for Language Processing: BNF Converter,
Functional Morphology, and Extract}},
school = {{Dept.\ of Computer Science and Engineering,
Chalmers University of Technology and
Gothenburg University}},
year = {2007}
}
@InProceedings{peb-parsing,
author = {P. Ljungl\"of},
title = {{Grammatical Framework and Multiple Context-Free Grammars}},
@@ -1203,6 +1348,17 @@
url = "ftp://ftp.cs.iastate.edu/pub/techreports/TR98-06/TR.ps.gz"
}
@inproceedings{nlyacc,
author = {Masayuki Ishii and Kazuhisa Ohta and Hiroaki Saito},
title = {An efficient parser generator for natural language},
booktitle = {Proceedings of the 15th conference on Computational linguistics},
year = {1994},
pages = {417--420},
location = {Kyoto, Japan},
doi = {http://dx.doi.org/10.3115/991886.991959},
publisher = {Association for Computational Linguistics},
address = {Morristown, NJ, USA},
}
@TechReport{johnson-yacc,
author = {S. C. Johnson},
@@ -1894,6 +2050,13 @@
year = {{1998}}
}
@Book{LindholmYellinJVM,
editor = {T. Lindholm and F. Yellin},
title = {{The Java Virtual Machine Specification Second Edition}},
publisher = {{Addison-Wesley}},
year = {{1999}}
}
@Book{VanDerLinden99a,
author = "Peter {van der Linden}",
title = "Just {Java} 1.2",

View File

@@ -30,15 +30,19 @@ oper
d08A : Str -> NForms -- 5 vinaigrette
= \s -> dNukke s (weakGrade s + "n") ;
d09 : Str -> NForms -- 696 ääriraja
= \s -> dUkko s (s + "n") ;
= \s -> let a = last s in dSilakka s
(s + "n")
(init s + case a of {"a" => "o" ; _ => "ö"} + "j" + a) ;
d09A : Str -> NForms -- 1040 ääniraita
= \s -> dUkko s (s + weakGrade "n") ;
= \s -> let a = last s in dSilakka s
(weakGrade s + "n")
(init s + case a of {"a" => "o" ; _ => "ö"} + "j" + a) ;
d10 : Str -> NForms -- 2119 äänittäjä
= \s -> dSilakka s (s + "n") (init s + "i" + vowelHarmony (last s)) ;
d10A : Str -> NForms -- 284 änkkä
= \s -> dUkko s (weakGrade s + "n") ;
= \s -> dSilakka s (weakGrade s + "n") (init s + "i" + vowelHarmony (last s)) ;
d11 : Str -> NForms -- 46 ödeema
= \s -> dUkko s (s + "n") ;
= \s -> dSilakka s (weakGrade s + "n") (init s + "i" + vowelHarmony (last s)) ;
d12 : Str -> NForms -- 1125 örinä
= \s -> let a = vowelHarmony (last s) in
dSilakka s (s + "n")
@@ -174,7 +178,10 @@ oper
d48A : Str -> NForms -- 481 äänne
= \s -> dRae s (strongGrade s + "en") ;
d49 : Str -> NForms -- 31 vempele
= \s -> dRae s (s + "en") ;
= \s -> case last s of {
"e" => dRae s (s + "en") ;
_ => dPiennar s (s + "en")
} ;
d49A : Str -> NForms -- 11 vemmel
= \s -> dPiennar s (strongGrade (init s) + "len") ;
{-

View File

@@ -14,8 +14,8 @@ verbs:
cat all-differences-V
nouns:
export LEX=NSSK ; make -e tests
export LEX=Omat ; make -e tests
# export LEX=NSSK ; make -e tests
# export LEX=Omat ; make -e tests
export LEX=Swadesh ; make -e tests
export LEX=Dictionary ; make -e tests
export LEX=Duodecim ; make -e tests
@@ -33,13 +33,13 @@ CSC:
gf-files:
runghc MkLex.hs 0 $(CAT) $(LEX) > $(LEX)Abs.gf
runghc MkLex.hs 1 $(CAT) $(LEX) > $(LEX)1.gf
# runghc MkLex.hs 1 $(CAT) $(LEX) > $(LEX)1.gf
runghc MkLex.hs 2 $(CAT) $(LEX) > $(LEX)2.gf
runghc MkLex.hs 3 $(CAT) $(LEX) > $(LEX)3.gf
runghc MkLex.hs 4 $(CAT) $(LEX) > $(LEX)4.gf
experiments: gf-files
echo "gt -cat=Utt | l | wf exper1-$(LEX).txt" | gf -s $(LEX)1.gf
# echo "gt -cat=Utt | l | wf exper1-$(LEX).txt" | gf -s $(LEX)1.gf
echo "gt -cat=Utt | l | wf exper2-$(LEX).txt" | gf -s $(LEX)2.gf
echo "gt -cat=Utt | l | wf exper3-$(LEX).txt" | gf -s $(LEX)3.gf
echo "gt -cat=Utt | l | wf exper4-$(LEX).txt" | gf -s $(LEX)4.gf

View File

@@ -144,6 +144,10 @@ resource Nominal = ResFin ** open MorphoFin,Declensions,CatFin,Prelude in {
dArpi ukko (init (weakGrade ukko) + "en") ;
<_ + "i", _ + ("eita" | "eitä")> =>
dTohtori ukko ;
<_ + "e", nuk + ("eja" | "ejä")> =>
dNukke ukko ukon ;
<_, _ + ":" + _ + ("a" | "ä")> => dSDP ukko ;
<_ + ("l" | "n" | "r" | "s"), _ + ("eja" | "ejä")> => dUnix ukko ;
<_, _ + ("a" | "ä")> => ukot ;
_ =>
Predef.error
@@ -168,7 +172,7 @@ resource Nominal = ResFin ** open MorphoFin,Declensions,CatFin,Prelude in {
dRae ukko ukon ;
<taiv + ("as" | "äs"), taiv + ("aan" | "ään")> =>
dRae ukko ukon ;
<nukk + "e", nuk + "en"> => dNukke ukko ukon ;
<nukk + "e", nuk + "een"> => dRae ukko ukon ;
<arp + "i", arv + "en"> => dArpi ukko ukon ;
<_ + ("us" | "ys"), _ + "den"> => dLujuus ukko ;
<_, _ + ":n"> => dSDP ukko ;

File diff suppressed because it is too large Load Diff