forked from GitHub/gf-core
final version of kotus experiment
This commit is contained in:
169
doc/gf-bib.bib
169
doc/gf-bib.bib
@@ -112,6 +112,13 @@
|
||||
PUBLISHER = {{Springer-Verlag}}
|
||||
}
|
||||
|
||||
@book{CopestakeLKB,
|
||||
AUTHOR = {A. Copestake},
|
||||
TITLE = {{Implementing Typed Feature Structure Grammars}},
|
||||
YEAR = {2002},
|
||||
PUBLISHER = {{CSLI Publications}}
|
||||
}
|
||||
|
||||
@book{stroustrup,
|
||||
AUTHOR = {B. Stroustrup},
|
||||
TITLE = {{The C++ Programming Language, Third Edition}},
|
||||
@@ -287,6 +294,30 @@
|
||||
year = {2002}
|
||||
}
|
||||
|
||||
@InProceedings{saghein-1978,
|
||||
author = "Anna {S\aa gvall Hein}",
|
||||
title = {{Finnish Morphological Analysis in the Reversible Grammar System}},
|
||||
booktitle = {{COLING 78, Information Abstracts}},
|
||||
year = {1978}
|
||||
}
|
||||
|
||||
@ARTICLE{saghein-1980,
|
||||
AUTHOR = "Anna {S\aa gvall Hein}",
|
||||
TITLE = "An Outline of a Computer Model of Finnish Word Recognition",
|
||||
JOURNAL = {{Fenno-Ugrica Suecana}},
|
||||
VOLUME = {3},
|
||||
PAGES = {7--26},
|
||||
YEAR = {1980} }
|
||||
|
||||
@ARTICLE{koskenniemi-1980,
|
||||
AUTHOR = "Kimmo Koskenniemi",
|
||||
TITLE = "On Automatic Lemmatization of Finnish",
|
||||
JOURNAL = {{Fenno-Ugrica Suecana}},
|
||||
VOLUME = {3},
|
||||
PAGES = {27--44},
|
||||
YEAR = {1980} }
|
||||
|
||||
|
||||
@book{martin-lof,
|
||||
AUTHOR = {P. Martin-L\"{o}f},
|
||||
TITLE = {{Intuitionistic Type Theory}},
|
||||
@@ -512,6 +543,15 @@
|
||||
year = 2001
|
||||
}
|
||||
|
||||
@inproceedings{carlson-2005,
|
||||
title = {{Inducing a Morphological Transducer from Inflectional Paradigms}},
|
||||
author = {Lauri Carlson},
|
||||
booktitle = {{Inquiries into Words, Constraints and Contexts.
|
||||
Festschrift for Kimmo Koskenniemi on his 60th Birthday}},
|
||||
publisher = {{CSLI}},
|
||||
year = 2005
|
||||
}
|
||||
|
||||
@BOOK{dowty,
|
||||
AUTHOR = "Dowty, D",
|
||||
TITLE = "Word Meaning and Montague Grammar",
|
||||
@@ -856,6 +896,17 @@
|
||||
pages = {607--639}
|
||||
}
|
||||
|
||||
@inproceedings{TomitaCarbobell,
|
||||
author = {Masaru Tomita and
|
||||
Jaime G. Carbonell},
|
||||
title = {The Universal Parser Architecture for Knowledge-based Machine
|
||||
Translation},
|
||||
booktitle = {IJCAI},
|
||||
year = {1987},
|
||||
pages = {718--721},
|
||||
bibsource = {DBLP, http://dblp.uni-trier.de}
|
||||
}
|
||||
|
||||
|
||||
@InProceedings{luocall,
|
||||
author = {Z. Luo and P. Callaghan},
|
||||
@@ -1023,14 +1074,61 @@
|
||||
volume={14(2)},
|
||||
YEAR = {2004} }
|
||||
|
||||
@ARTICLE{huet-2005,
|
||||
AUTHOR = "Gerard Huet",
|
||||
TITLE = {{A Functional Toolkit for Morphological and Phonological Processing, Application to a Sanskrit Tagger}},
|
||||
JOURNAL = {{The Journal of Functional Programming}},
|
||||
pages={573--614},
|
||||
volume={15(4)},
|
||||
YEAR = {2005} }
|
||||
|
||||
@InProceedings{extract-2006,
|
||||
AUTHOR = "M. Forsberg and H. Hammarstr{\"o}m and A. Ranta",
|
||||
TITLE = {{Morphological Lexicon Extraction from Raw Text Data}},
|
||||
booktitle = {{FinTAL 2006}},
|
||||
year = {{2006}},
|
||||
series = {{LNCS/LNAI}},
|
||||
volume = {4139},
|
||||
editor = {T. Salakoski}
|
||||
}
|
||||
|
||||
@misc{minnen95offline,
|
||||
author = "G. Minnen and D. Gerdemann and T. G{\"o}tz",
|
||||
title = "Off-line Optimization for {Earley}-style {HPSG} Processing",
|
||||
text = "G. Minnen, D. Gerdemann, and T. Gotz. Off-line optimization for Earley-style
|
||||
HPSG processing. In Proc. of the 7th Conference of the EACL, Dublin, 1995.",
|
||||
year = "1995",
|
||||
url = "citeseer.ist.psu.edu/article/minnen95offline.html" }
|
||||
|
||||
@Misc{Happy-GLR,
|
||||
author = {P. Callaghan and B. Medlock},
|
||||
title = {{Happy-GLR}},
|
||||
note = {\verb6http://www.dur.ac.uk/p.c.callaghan/happy-glr/6},
|
||||
year = 2004
|
||||
}
|
||||
|
||||
@Misc{XLE-homepage,
|
||||
author = {R. Kaplan and J. Maxwell},
|
||||
title = {{XLE Project Homepage}},
|
||||
note = {\verb6http://www2.parc.com/isl/groups/nltt/xle/6},
|
||||
year = 2007
|
||||
}
|
||||
|
||||
|
||||
|
||||
@Misc{GF-homepage,
|
||||
author = {A. Ranta},
|
||||
title = {{Grammatical Framework Homepage}},
|
||||
note = {\verb6www.cs.chalmers.se/~aarne/GF/6},
|
||||
url = "http://www.cs.chalmers.se/~aarne/GF/",
|
||||
year = 2002
|
||||
note = {\verb6digitalgrammars.com/gf6},
|
||||
url = "digitalgrammars.com/gf",
|
||||
year = 2008
|
||||
}
|
||||
|
||||
@Misc{kotus-wordlist,
|
||||
author = "{Kotimaisten Kielten Tutkimuskeskus}",
|
||||
title = {{KOTUS Wordlist}},
|
||||
note = {\verb6kaino.kotus.fi/sanat/nykysuomi6},
|
||||
year = 2006
|
||||
}
|
||||
|
||||
@Misc{happy,
|
||||
@@ -1050,6 +1148,27 @@
|
||||
YEAR = {1994}
|
||||
}
|
||||
|
||||
@Book{nssk,
|
||||
editor = {M. Sadeniemi},
|
||||
title = {{Nykysuomen sanakirja}},
|
||||
publisher = {{WSOY}},
|
||||
year = {1961}
|
||||
}
|
||||
|
||||
@Book{hellberg,
|
||||
author = {S. Hellberg},
|
||||
title = {{The Morphology of Present-Day Swedish}},
|
||||
publisher = {{Almqvist \& Wiksell}},
|
||||
year = {1978}
|
||||
}
|
||||
|
||||
@Book{karlsson-1977,
|
||||
author = {F. Karlsson},
|
||||
title = {{Finsk grammatik}},
|
||||
publisher = {{Suomalaisen Kirjallisuuden Seura}},
|
||||
year = {1977}
|
||||
}
|
||||
|
||||
@Book{Ranta94,
|
||||
author = {A. Ranta},
|
||||
title = {{Type Theoretical Grammar}},
|
||||
@@ -1072,6 +1191,14 @@
|
||||
year = 1998
|
||||
}
|
||||
|
||||
@InProceedings{brodda-karlsson,
|
||||
author = {B. Brodda and F. Karlsson},
|
||||
title = {{An Experiment with Automatic Morphological Analysis of Finnish}},
|
||||
series = {{Papers from the Institute of Linguistics, University of Stockholm}},
|
||||
volume = 40,
|
||||
year = 1978
|
||||
}
|
||||
|
||||
|
||||
|
||||
@PhdThesis{fiedler,
|
||||
@@ -1081,6 +1208,14 @@
|
||||
year = 2001
|
||||
}
|
||||
|
||||
@PhdThesis{koskenniemi-1983,
|
||||
author = {Kimmo Koskenniemi},
|
||||
title = {{Two-Level Morphology: A General Computational Model for
|
||||
Word-Form Recognition and Production}},
|
||||
school = {{University of Helsinki}},
|
||||
year = 1983
|
||||
}
|
||||
|
||||
@PhdThesis{peb,
|
||||
author = {P. Ljungl\"of},
|
||||
title = {{The Expressivity and Complexity of Grammatical Framework}},
|
||||
@@ -1090,6 +1225,16 @@
|
||||
year = {2004}
|
||||
}
|
||||
|
||||
@PhdThesis{forsberg-2007,
|
||||
author = {Markus Forsberg},
|
||||
title = {{Three Tools for Language Processing: BNF Converter,
|
||||
Functional Morphology, and Extract}},
|
||||
school = {{Dept.\ of Computer Science and Engineering,
|
||||
Chalmers University of Technology and
|
||||
Gothenburg University}},
|
||||
year = {2007}
|
||||
}
|
||||
|
||||
@InProceedings{peb-parsing,
|
||||
author = {P. Ljungl\"of},
|
||||
title = {{Grammatical Framework and Multiple Context-Free Grammars}},
|
||||
@@ -1203,6 +1348,17 @@
|
||||
url = "ftp://ftp.cs.iastate.edu/pub/techreports/TR98-06/TR.ps.gz"
|
||||
}
|
||||
|
||||
@inproceedings{nlyacc,
|
||||
author = {Masayuki Ishii and Kazuhisa Ohta and Hiroaki Saito},
|
||||
title = {An efficient parser generator for natural language},
|
||||
booktitle = {Proceedings of the 15th conference on Computational linguistics},
|
||||
year = {1994},
|
||||
pages = {417--420},
|
||||
location = {Kyoto, Japan},
|
||||
doi = {http://dx.doi.org/10.3115/991886.991959},
|
||||
publisher = {Association for Computational Linguistics},
|
||||
address = {Morristown, NJ, USA},
|
||||
}
|
||||
|
||||
@TechReport{johnson-yacc,
|
||||
author = {S. C. Johnson},
|
||||
@@ -1894,6 +2050,13 @@
|
||||
year = {{1998}}
|
||||
}
|
||||
|
||||
@Book{LindholmYellinJVM,
|
||||
editor = {T. Lindholm and F. Yellin},
|
||||
title = {{The Java Virtual Machine Specification, Second Edition}},
|
||||
publisher = {{Addison-Wesley}},
|
||||
year = {{1999}}
|
||||
}
|
||||
|
||||
@Book{VanDerLinden99a,
|
||||
author = "Peter {van der Linden}",
|
||||
title = "Just {Java} 1.2",
|
||||
|
||||
@@ -30,15 +30,19 @@ oper
|
||||
d08A : Str -> NForms -- 5 vinaigrette
|
||||
= \s -> dNukke s (weakGrade s + "n") ;
|
||||
d09 : Str -> NForms -- 696 ääriraja
|
||||
= \s -> dUkko s (s + "n") ;
|
||||
= \s -> let a = last s in dSilakka s
|
||||
(s + "n")
|
||||
(init s + case a of {"a" => "o" ; _ => "ö"} + "j" + a) ;
|
||||
d09A : Str -> NForms -- 1040 ääniraita
|
||||
= \s -> dUkko s (s + weakGrade "n") ;
|
||||
= \s -> let a = last s in dSilakka s
|
||||
(weakGrade s + "n")
|
||||
(init s + case a of {"a" => "o" ; _ => "ö"} + "j" + a) ;
|
||||
d10 : Str -> NForms -- 2119 äänittäjä
|
||||
= \s -> dSilakka s (s + "n") (init s + "i" + vowelHarmony (last s)) ;
|
||||
d10A : Str -> NForms -- 284 änkkä
|
||||
= \s -> dUkko s (weakGrade s + "n") ;
|
||||
= \s -> dSilakka s (weakGrade s + "n") (init s + "i" + vowelHarmony (last s)) ;
|
||||
d11 : Str -> NForms -- 46 ödeema
|
||||
= \s -> dUkko s (s + "n") ;
|
||||
= \s -> dSilakka s (weakGrade s + "n") (init s + "i" + vowelHarmony (last s)) ;
|
||||
d12 : Str -> NForms -- 1125 örinä
|
||||
= \s -> let a = vowelHarmony (last s) in
|
||||
dSilakka s (s + "n")
|
||||
@@ -174,7 +178,10 @@ oper
|
||||
d48A : Str -> NForms -- 481 äänne
|
||||
= \s -> dRae s (strongGrade s + "en") ;
|
||||
d49 : Str -> NForms -- 31 vempele
|
||||
= \s -> dRae s (s + "en") ;
|
||||
= \s -> case last s of {
|
||||
"e" => dRae s (s + "en") ;
|
||||
_ => dPiennar s (s + "en")
|
||||
} ;
|
||||
d49A : Str -> NForms -- 11 vemmel
|
||||
= \s -> dPiennar s (strongGrade (init s) + "len") ;
|
||||
{-
|
||||
|
||||
@@ -14,8 +14,8 @@ verbs:
|
||||
cat all-differences-V
|
||||
|
||||
nouns:
|
||||
export LEX=NSSK ; make -e tests
|
||||
export LEX=Omat ; make -e tests
|
||||
# export LEX=NSSK ; make -e tests
|
||||
# export LEX=Omat ; make -e tests
|
||||
export LEX=Swadesh ; make -e tests
|
||||
export LEX=Dictionary ; make -e tests
|
||||
export LEX=Duodecim ; make -e tests
|
||||
@@ -33,13 +33,13 @@ CSC:
|
||||
|
||||
gf-files:
|
||||
runghc MkLex.hs 0 $(CAT) $(LEX) > $(LEX)Abs.gf
|
||||
runghc MkLex.hs 1 $(CAT) $(LEX) > $(LEX)1.gf
|
||||
# runghc MkLex.hs 1 $(CAT) $(LEX) > $(LEX)1.gf
|
||||
runghc MkLex.hs 2 $(CAT) $(LEX) > $(LEX)2.gf
|
||||
runghc MkLex.hs 3 $(CAT) $(LEX) > $(LEX)3.gf
|
||||
runghc MkLex.hs 4 $(CAT) $(LEX) > $(LEX)4.gf
|
||||
|
||||
experiments: gf-files
|
||||
echo "gt -cat=Utt | l | wf exper1-$(LEX).txt" | gf -s $(LEX)1.gf
|
||||
# echo "gt -cat=Utt | l | wf exper1-$(LEX).txt" | gf -s $(LEX)1.gf
|
||||
echo "gt -cat=Utt | l | wf exper2-$(LEX).txt" | gf -s $(LEX)2.gf
|
||||
echo "gt -cat=Utt | l | wf exper3-$(LEX).txt" | gf -s $(LEX)3.gf
|
||||
echo "gt -cat=Utt | l | wf exper4-$(LEX).txt" | gf -s $(LEX)4.gf
|
||||
|
||||
@@ -144,6 +144,10 @@ resource Nominal = ResFin ** open MorphoFin,Declensions,CatFin,Prelude in {
|
||||
dArpi ukko (init (weakGrade ukko) + "en") ;
|
||||
<_ + "i", _ + ("eita" | "eitä")> =>
|
||||
dTohtori ukko ;
|
||||
<_ + "e", nuk + ("eja" | "ejä")> =>
|
||||
dNukke ukko ukon ;
|
||||
<_, _ + ":" + _ + ("a" | "ä")> => dSDP ukko ;
|
||||
<_ + ("l" | "n" | "r" | "s"), _ + ("eja" | "ejä")> => dUnix ukko ;
|
||||
<_, _ + ("a" | "ä")> => ukot ;
|
||||
_ =>
|
||||
Predef.error
|
||||
@@ -168,7 +172,7 @@ resource Nominal = ResFin ** open MorphoFin,Declensions,CatFin,Prelude in {
|
||||
dRae ukko ukon ;
|
||||
<taiv + ("as" | "äs"), taiv + ("aan" | "ään")> =>
|
||||
dRae ukko ukon ;
|
||||
<nukk + "e", nuk + "en"> => dNukke ukko ukon ;
|
||||
<nukk + "e", nuk + "een"> => dRae ukko ukon ;
|
||||
<arp + "i", arv + "en"> => dArpi ukko ukon ;
|
||||
<_ + ("us" | "ys"), _ + "den"> => dLujuus ukko ;
|
||||
<_, _ + ":n"> => dSDP ukko ;
|
||||
|
||||
File diff suppressed because it is too large
Load Diff
Reference in New Issue
Block a user