forked from GitHub/gf-core
preparing a new DictEngFin from WN data
This commit is contained in:
13
lib/src/finnish/stemmed/ElimPredef.hs
Normal file
13
lib/src/finnish/stemmed/ElimPredef.hs
Normal file
@@ -0,0 +1,13 @@
|
||||
import qualified Data.Set as S
|
||||
|
||||
-- comment out words that are predefined in another lexicon
|
||||
-- usage: runghc ElimPredef.hs <DictEngFin.gf   (reads predef.txt from the current directory, writes to stdout)
|
||||
|
||||
-- | Comment out dictionary entries that are predefined in another lexicon.
--
-- Reads @predef.txt@ from the current directory and takes the first
-- whitespace-separated token of each of its lines as a predefined word.
-- Standard input is then copied to standard output line by line, with every
-- line passed through 'elimPredef'.
main :: IO ()
main = do
  -- 'take 1 . words' yields the first token of a line, or nothing at all for
  -- a blank line, so blank lines in predef.txt are skipped instead of
  -- crashing the way 'head . words' would.
  predefs <- S.fromList . concatMap (take 1 . words) . lines <$> readFile "predef.txt"
  interact (unlines . map (elimPredef predefs) . lines)
|
||||
|
||||
-- | Prefix @line@ with @--PREDEF @ when its first whitespace-separated word
-- is a member of @predefs@; any other line (including a blank one) is
-- returned unchanged.
elimPredef :: S.Set String -> String -> String
elimPredef predefs line
  | startsWithPredef = "--PREDEF " ++ line
  | otherwise        = line
  where
    -- 'take 1' gives a list of at most one word, so 'any' is False for
    -- lines that contain no words at all.
    startsWithPredef = any (`S.member` predefs) (take 1 (words line))
|
||||
|
||||
Reference in New Issue
Block a user