new big and shallow modules

This commit is contained in:
aarne
2006-11-02 17:04:35 +00:00
parent 4905ceac59
commit 13cd2b96be
12 changed files with 6312 additions and 67 deletions

View File

@@ -1,6 +1,8 @@
concrete BigLexEng of BigLexEngAbs = CatEng ** open ParadigmsEng in {
-- adapted from a word list by Alan Black. Not to be used for military purposes.
-- Adapted from a word list by Alan Black & al.
-- http://www.cs.cmu.edu/~awb/pub/map/MAP3.1.tar.gz
-- Not to be used for military purposes.
lin abandon24 = regV2 "abandon" "" ;
lin abbreviate25 = regV "abbreviate" ;
@@ -452,6 +454,7 @@ lin axiom533 = regN "axiom" ;
lin axiomatic534 = regA "axiomatic" ;
lin axiomatize535 = regV2 "axiomatize" "" ;
lin axis536 = regN "axis" ;
lin baby537 = regN "baby" ;
lin back538 = regN "back" ;
lin background539 = regN "background" ;
@@ -463,7 +466,7 @@ lin bacterium546 = regN "bacterium" ;
lin bad547 = regA "bad" ;
lin bag548 = regN "bag" ;
lin bake549 = regV2 "bake" "" ;
lin bake550 = regV2 "bake" "" ;
--lin bake550 = regV2 "bake" "" ;
lin balance551 = regV "balance" ;
lin ball552 = regN "ball" ;
lin ballad553 = regN "ballad" ;
@@ -474,7 +477,7 @@ lin bang557 = regN "bang" ;
lin banish558 = regV2 "banish" "" ;
lin bank559 = regN "bank" ;
lin bar560 = regN "bar" ;
lin bar561 = regV2 "bar" "" ;
lin bar561 = regV2 "bar" "" ;--
lin bare562 = regA "bare" ;
lin bare563 = regV2 "bare" "" ;
lin bark564 = regN "bark" ;
@@ -487,9 +490,9 @@ lin base570 = regV3 "base" "" "loc" ;
lin basic572 = regA "basic" ;
lin basically573 = mkAdv "basically" ;
lin basin574 = regN "basin" ;
lin basis575 = regN "basis" ;
lin basis576 = regN "basis" ;
lin basis577 = regN "basis" ;
lin basis575 = regN "basis" ;--
--lin basis576 = regN "basis" ;
--lin basis577 = regN "basis" ;
lin basket578 = regN "basket" ;
lin bat579 = regN "bat" ;
lin batch580 = regN "batch" ;
@@ -497,20 +500,20 @@ lin bath581 = regN "bath" ;
lin bathe582 = regV "bathe" ;
lin batsman583 = regN "batsman" ;
lin battle585 = regN "battle" ;
lin be586 = regV "be" ;
--lin be586 = regV "be" ;
lin beach587 = regN "beach" ;
lin beak588 = regN "beak" ;
lin beam589 = regN "beam" ;
lin bean590 = regN "bean" ;
lin bear591 = regN "bear" ;
lin bear592 = regV2 "bear" "" ;
--lin bear592 = regV2 "bear" "" ;
lin beard593 = regN "beard" ;
lin beast594 = regN "beast" ;
lin beat595 = regV2 "beat" "" ;
lin beat596 = regV2 "beat" "" ;
--lin beat596 = regV2 "beat" "" ;
lin beauty598 = regN "beauty" ;
lin become602 = regV2 "become" "" ;
lin become603 = regV2 "become" "" ;
--lin become603 = regV2 "become" "" ;
lin bed604 = regN "bed" ;
lin bee605 = regN "bee" ;
lin beer607 = regN "beer" ;
@@ -522,22 +525,22 @@ lin behave617 = regV "behave" ;
lin behaviour618 = regN "behaviour" ;
lin being621 = regN "being" ;
lin belief622 = regN "belief" ;
lin belief623 = regN "belief" ;
lin belief624 = regN "belief" ;
--lin belief623 = regN "belief" ;
--lin belief624 = regN "belief" ;
lin believe625 = regV2 "believe" "" ;
lin believe626 = regV2 "believe" "in" ;
lin believe627 = regV2 "believe" "" ;
lin believe628 = regV2 "believe" "" ;
lin believe629 = regV2 "believe" "" ;
--lin believe627 = regV2 "believe" "" ;
--lin believe628 = regV2 "believe" "" ;
--lin believe629 = regV2 "believe" "" ;
lin bell630 = regN "bell" ;
lin belong631 = regV2 "belong" "" ;
lin beloved632 = regA "beloved" ;
lin beloved633 = regA "beloved" ;
--lin beloved633 = regA "beloved" ;
lin belt635 = regN "belt" ;
lin bench636 = regN "bench" ;
lin bend637 = regV "bend" ;
lin beneficial639 = regA "beneficial" ;
lin beneficial640 = regA "beneficial" ;
--lin beneficial640 = regA "beneficial" ;
lin benefit641 = regN "benefit" ;
lin berry644 = regN "berry" ;
lin bet648 = regN "bet" ;
@@ -549,14 +552,14 @@ lin bibliography658 = regN "bibliography" ;
lin biconditional659 = regV "biconditional" ;
lin bicycle660 = regN "bicycle" ;
lin bidirectional661 = regA "bidirectional" ;
lin big662 = regA "big" ;
lin big662 = regA "big" ;--
lin bike663 = regN "bike" ;
lin bill664 = regN "bill" ;
lin bill665 = regN "bill" ;
--lin bill665 = regN "bill" ;
lin billion666 = regN "billion" ;
lin bin667 = regN "bin" ;
lin binary668 = regA "binary" ;
lin bind669 = regV2 "bind" "" ;
--lin bind669 = regV2 "bind" "" ;
lin binding670 = regN "binding" ;
lin bird671 = regN "bird" ;
lin birth672 = regN "birth" ;
@@ -564,7 +567,7 @@ lin birthday673 = regN "birthday" ;
lin bisect674 = regV "bisect" ;
lin bisector675 = regN "bisector" ;
lin bit676 = regN "bit" ;
lin bite678 = regV2 "bite" "" ;
--lin bite678 = regV2 "bite" "" ;
lin bitter680 = regA "bitter" ;
lin bizarre682 = regA "bizarre" ;
lin black683 = regA "black" ;
@@ -572,7 +575,7 @@ lin blackboard684 = regN "blackboard" ;
lin blade685 = regN "blade" ;
lin blame686 = regV3 "blame" "" "for" ;
lin blame687 = regN "blame" ;
lin blame688 = regN "blame" ;
--lin blame688 = regN "blame" ;
lin blank689 = regA "blank" ;
lin blank690 = regN "blank" ;
lin bleed693 = regV "bleed" ;
@@ -582,7 +585,7 @@ lin block697 = regN "block" ;
lin block698 = regV2 "block" "" ;
lin blood699 = regN "blood" ;
lin blow700 = regN "blow" ;
lin blow701 = regV "blow" ;
--lin blow701 = regV "blow" ;
lin blue703 = regA "blue" ;
lin bluff704 = regV2 "bluff" "" ;
lin board705 = regN "board" ;
@@ -612,7 +615,7 @@ lin borrow731 = regV3 "borrow" "" "from" ;
lin boss732 = regN "boss" ;
lin both735 = regA "both" ;
lin bother736 = regV "bother" ;
lin bother737 = regV "bother" ;
--lin bother737 = regV "bother" ;
lin bother738 = regV2 "bother" "" ;
lin bother739 = regV2 "bother" "about" ;
lin bottle740 = regN "bottle" ;
@@ -640,12 +643,12 @@ lin breach765 = regV2 "breach" "" ;
lin bread766 = regN "bread" ;
lin breadth767 = regN "breadth" ;
lin break768 = regN "break" ;
lin break769 = regV2 "break" "" ;
--lin break769 = regV2 "break" "" ;
lin breakage770 = regN "breakage" ;
lin breakfast771 = regN "breakfast" ;
lin breath772 = regN "breath" ;
lin breathe773 = regV2 "breathe" "" ;
lin breed774 = regV "breed" ;
--lin breed774 = regV "breed" ;
lin breed775 = regN "breed" ;
lin breeze776 = regN "breeze" ;
lin brew777 = regV2 "brew" "" ;
@@ -656,7 +659,7 @@ lin brief781 = regA "brief" ;
lin briefs782 = regN "briefs" ;
lin bright783 = regA "bright" ;
lin brilliant785 = regA "brilliant" ;
lin bring786 = regV2 "bring" "" ;
--lin bring786 = regV2 "bring" "" ;
lin bristle787 = regN "bristle" ;
lin britain788 = regN "britain" ;
lin british789 = regA "british" ;
@@ -665,18 +668,18 @@ lin broad791 = regA "broad" ;
lin broadcast792 = regN "broadcast" ;
lin bronchitis795 = regN "bronchitis" ;
lin brother796 = regN "brother" ;
lin brother797 = regN "brother" ;
--lin brother797 = regN "brother" ;
lin brown800 = regA "brown" ;
lin bruise801 = regN "bruise" ;
lin bruise802 = regV2 "bruise" "" ;
lin brute803 = regN "brute" ;
lin bucket804 = regN "bucket" ;
lin bud805 = regN "bud" ;
lin bud806 = regV2 "bud" "" ;
lin bud806 = regV2 "bud" "" ;--
lin buffer807 = regN "buffer" ;
lin buffer808 = regV2 "buffer" "" ;
lin bug809 = regN "bug" ;
lin build810 = regV2 "build" "" ;
--lin build810 = regV2 "build" "" ;
lin building811 = regN "building" ;
lin bullet814 = regN "bullet" ;
lin bully815 = regN "bully" ;
@@ -685,9 +688,9 @@ lin bun817 = regN "bun" ;
lin bunch818 = regN "bunch" ;
lin bundle819 = regN "bundle" ;
lin burden820 = regN "burden" ;
lin burn821 = regV2 "burn" "" ;
--lin burn821 = regV2 "burn" "" ;
lin burst825 = regV "burst" ;
lin burst826 = regV "burst" ;
--lin burst826 = regV "burst" ;
lin bury827 = regV2 "bury" "" ;
lin bus828 = regN "bus" ;
lin bush829 = regN "bush" ;
@@ -697,8 +700,9 @@ lin butter833 = regN "butter" ;
lin butter834 = regV2 "butter" "" ;
lin butterfly835 = regN "butterfly" ;
lin button836 = regN "button" ;
lin buy837 = regV2 "buy" "" ;
--lin buy837 = regV2 "buy" "" ;
lin buzz838 = regV "buzz" ;
lin cabinet842 = regN "cabinet" ;
lin cable843 = regN "cable" ;
lin cage844 = regN "cage" ;
@@ -2558,13 +2562,13 @@ lin hasty2848 = regA "hasty" ;
lin hat2849 = regN "hat" ;
lin hate2850 = regV2 "hate" "" ;
lin hatred2851 = regN "hatred" ;
lin have2852 = regV2 "have" "" ;
lin have2853 = regV2 "have" "" ;
--lin have2852 = regV2 "have" "" ;
--lin have2853 = regV2 "have" "" ;
lin haven2854 = regN "haven" ;
lin having2857 = regV "having" ;
lin hazard2858 = regN "hazard" ;
lin haze2859 = regN "haze" ;
lin he2860 = regN "he" ;
--lin he2860 = regN "he" ;
lin head2861 = regN "head" ;
lin head2862 = regV2 "head" "" ;
lin heading2863 = regN "heading" ;
@@ -2697,7 +2701,7 @@ lin hypotheses3015 = regN "hypotheses" ;
lin hypothesis3016 = regN "hypothesis" ;
lin hypothesize3017 = regV2 "hypothesize" "" ;
lin hypothetical3018 = regA "hypothetical" ;
lin i3019 = regN "i" ;
--lin i3019 = regN "i" ;
lin ice3021 = regN "ice" ;
lin iceland3022 = regN "iceland" ;
lin icelandic3023 = regA "icelandic" ;
@@ -2705,7 +2709,7 @@ lin icon3024 = regN "icon" ;
lin idea3025 = regN "idea" ;
lin ideal3026 = regA "ideal" ;
lin identical3027 = regA "identical" ;
lin identical3028 = regA "identical" ;
--lin identical3028 = regA "identical" ;
lin identify3029 = regV2 "identify" "" ;
lin identity3030 = regN "identity" ;
lin idiocy3031 = regN "idiocy" ;
@@ -3011,8 +3015,8 @@ lin isolate3357 = regV2 "isolate" "" ;
lin isomorphic3358 = regA "isomorphic" ;
lin issue3359 = regV "issue" ;
lin issue3360 = regN "issue" ;
lin it3362 = regN "it" ;
lin it3363 = regN "it" ;
--lin it3362 = regN "it" ;
--lin it3363 = regN "it" ;
lin italy3364 = regN "italy" ;
lin item3365 = regN "item" ;
lin itemize3366 = regV2 "itemize" "" ;
@@ -4849,7 +4853,7 @@ lin shave5364 = regN "shave" ;
lin shave5365 = regV2 "shave" "" ;
lin shave5366 = regV2 "shave" "" ;
lin shaven5367 = regA "shaven" ;
lin she5368 = regN "she" ;
--lin she5368 = regN "she" ;
lin shear5369 = regV2 "shear" "" ;
lin shears5370 = regN "shears" ;
lin shed5371 = regN "shed" ;
@@ -5464,8 +5468,8 @@ lin text6069 = regN "text" ;
lin textbook6070 = regN "textbook" ;
lin thank6072 = regV2 "thank" "" ;
lin thanks6073 = regN "thanks" ;
lin that6077 = regN "that" ;
lin that6078 = regN "that" ;
--lin that6077 = regN "that" ;
--lin that6078 = regN "that" ;
lin theatre6080 = regN "theatre" ;
lin theatrical6081 = regA "theatrical" ;
lin thematic6085 = regA "thematic" ;
@@ -5850,7 +5854,7 @@ lin wave6527 = regV2 "wave" "to" ;
lin wave6528 = regN "wave" ;
lin wax6529 = regN "wax" ;
lin way6530 = regN "way" ;
lin we6531 = regN "we" ;
--lin we6531 = regN "we" ;
lin weak6532 = regA "weak" ;
lin wealth6533 = regN "wealth" ;
lin weapon6534 = regN "weapon" ;
@@ -5936,7 +5940,7 @@ lin work6668 = regV "work" ;
lin world6669 = regN "world" ;
lin worm6670 = regN "worm" ;
lin worry6672 = regV "worry" ;
lin worry6673 = regV "worry" ;
--lin worry6673 = regV "worry" ;
lin worry6674 = regV2 "worry" "" ;
lin worry6675 = regV2 "worry" "about" ;
lin worry6676 = regN "worry" ;
@@ -5944,7 +5948,7 @@ lin worship6678 = regV2 "worship" "" ;
lin worthless6681 = regA "worthless" ;
lin worthwhile6682 = regA "worthwhile" ;
lin worthy6683 = regA "worthy" ;
lin worthy6684 = regA "worthy" ;
--lin worthy6684 = regA "worthy" ;
lin would6685 = regV "would" ;
lin wound6689 = regV2 "wound" "" ;
lin wound6692 = regN "wound" ;
@@ -5953,7 +5957,7 @@ lin wreck6696 = regV2 "wreck" "" ;
lin wreck6697 = regN "wreck" ;
lin wrinkle6698 = regN "wrinkle" ;
lin wrist6699 = regN "wrist" ;
lin write6700 = regV2 "write" "" ;
--lin write6700 = regV2 "write" "" ;
lin wrong6702 = regA "wrong" ;
lin wry6704 = regA "wry" ;
lin yard6706 = regN "yard" ;
@@ -5963,7 +5967,7 @@ lin yellow6709 = regA "yellow" ;
lin yet6711 = mkAdv "yet" ;
lin yield6712 = regV2 "yield" "" ;
lin yield6713 = regN "yield" ;
lin you6714 = regN "you" ;
--lin you6714 = regN "you" ;
lin young6715 = regA "young" ;
lin youth6720 = regN "youth" ;
lin zero6721 = regA "zero" ;

26
examples/big/MkDict.hs Normal file
View File

@@ -0,0 +1,26 @@
-- | Path of the word list that 'main' reads.
infile :: FilePath
infile = "mywordlist1"

-- | Read 'infile', pass every line through 'mkOne', and print each result
--   on its own line of standard output.
main :: IO ()
main = readFile infile >>= mapM_ (putStrLn . mkOne) . lines
-- | Translate one line of the word list into one line of output.
--
--   * A line whose first word is @--@ yields the empty string.
--   * A line whose first word starts with @(@ and which has at least two
--     further words (the word form, then its category) yields
--     @"<category> <paradigm> <word>"@, with category and paradigm chosen
--     by 'mkCatf'.
--   * Any other line is returned unchanged behind a @"-- "@ prefix.
mkOne :: String -> String
mkOne s = convert (words s)
  where
    convert ("--" : _) = ""
    convert (('(' : _) : word : rawCat : rest) = unwords [cat, fun, word]
      where
        (cat, fun) = mkCatf (stripParens rawCat) (regularity rest)
    convert _ = "-- " ++ s

    -- "irreg" when the fields after the category contain the token "(REG",
    -- otherwise "reg".
    regularity rest
      | "(REG" `elem` rest = "irreg"
      | otherwise          = "reg"

    -- Drop every '(' and ')' character from a field.
    stripParens = filter (`notElem` "()")

-- | Map a category name from the word list to a pair of
--   (output category, paradigm function name).  Unlisted categories are
--   passed through unchanged, with a paradigm name built by prefixing "mk".
--
--   NOTE(review): the second argument (the "reg"/"irreg" flag computed by
--   'mkOne') is accepted but never inspected, so it has no effect on the
--   result -- confirm whether that is intended.
mkCatf :: String -> a -> (String, String)
mkCatf "Noun"        _ = ("N", "regN")
mkCatf "Adject"      _ = ("A", "regA")
mkCatf "Adject_LONG" _ = ("A", "longA")
mkCatf "Verb"        _ = ("V", "regV")
mkCatf "PNoun"       _ = ("PN", "regPN")
mkCatf other         _ = (other, "mk" ++ other)

6112
examples/big/mywordlist1 Normal file

File diff suppressed because it is too large Load Diff