From ae7f33bec015edfbf7393c2cc09a9803705107ae Mon Sep 17 00:00:00 2001 From: aarne Date: Sat, 4 Mar 2006 14:58:11 +0000 Subject: [PATCH] treebank creating script; duplicated consonants in LexiconEng --- resource-1.0/Makefile | 3 +++ resource-1.0/english/LexiconEng.gf | 14 +++++++------- resource-1.0/minimal/MinStructural.gf | 1 + resource-1.0/minimal/MinStructuralI.gf | 1 + resource-1.0/mkTreebank.gfs | 10 ++++++++++ 5 files changed, 22 insertions(+), 7 deletions(-) create mode 100644 resource-1.0/mkTreebank.gfs diff --git a/resource-1.0/Makefile b/resource-1.0/Makefile index 91e08f4d6..911744438 100644 --- a/resource-1.0/Makefile +++ b/resource-1.0/Makefile @@ -23,6 +23,9 @@ multimodal: compiled: cd .. ; tar cvfz compiled.tgz alltenses/ mathematical/ multimodal/ present/ +treebank: + gf " | wf min.xml +gt -depth=4 -cat=QS | tb -xml | grep -v "treebank>" | af min.xml +gt -depth=3 (UttImpSg ? ?) | tb -xml | grep -v "treebank>" | af min.xml +gt -depth=4 -cat=NP | tb -xml | grep -v "