1
0
forked from GitHub/gf-core

Uniform encoding: gfo and pgf in UTF-8, internal representation in Unicode

This commit is contained in:
aarne
2008-06-26 16:35:45 +00:00
parent 712717e461
commit 7f9a0cdd34
41 changed files with 159 additions and 73 deletions

View File

@@ -19,21 +19,21 @@ import System
-- Table of the languages handled by this script. Each entry pairs
-- (language name, three-letter language code) with a comma-separated
-- string of coding steps; the empty string means no step is listed.
-- NOTE(review): how the coding string is consumed is not visible here --
-- confirm against the use site.
--
-- Every language appears exactly once. Only Hindi and Thai keep a
-- transliteration step; no entry carries a "to_utf8" or "from_cp1251" step.
langsCoding = [
  (("arabic",     "Ara"),""),
  (("bulgarian",  "Bul"),""),
  (("catalan",    "Cat"),""),
  (("danish",     "Dan"),""),
  (("english",    "Eng"),""),
  (("finnish",    "Fin"),""),
  (("french",     "Fre"),""),
  (("hindi",      "Hin"),"to_devanagari"),
  (("german",     "Ger"),""),
  (("interlingua","Ina"),""),
  (("italian",    "Ita"),""),
  (("norwegian",  "Nor"),""),
  (("russian",    "Rus"),""),
  (("spanish",    "Spa"),""),
  (("swedish",    "Swe"),""),
  (("thai",       "Tha"),"to_thai")
  ]

-- The (name, code) pairs of all languages, in table order.
langs = map fst langsCoding

View File

@@ -1,4 +1,6 @@
concrete AdjectiveBul of Adjective = CatBul ** open ResBul, Prelude in {
flags coding=cp1251 ;
lin
PositA a = {
s = \\aform => a.s ! aform ;

View File

@@ -1,4 +1,6 @@
concrete AdverbBul of Adverb = CatBul ** open ResBul, Prelude in {
flags coding=cp1251 ;
lin
PositAdvAdj a = {s = a.adv} ;
ComparAdvAdj cadv a np = {

View File

@@ -3,4 +3,6 @@
-- Top-level Bulgarian concrete syntax: combines LangBul and ExtraBul and
-- adds no rules of its own. The module body only sets the coding flag
-- to cp1251.
concrete Bulgarian of BulgarianAbs =
  LangBul,
  ExtraBul
  ** {
  flags coding=cp1251 ;
} ;

View File

@@ -3,4 +3,6 @@
-- Abstract syntax matching the Bulgarian concrete module: combines Lang and
-- ExtraBulAbs and adds no functions of its own. The module body only sets
-- the coding flag to cp1251.
abstract BulgarianAbs =
  Lang,
  ExtraBulAbs
  ** {
  flags coding=cp1251 ;
} ;

View File

@@ -1,4 +1,6 @@
concrete CatBul of Cat = open ResBul, Prelude, (R = ParamX) in {
concrete CatBul of Cat = open ResBul, Prelude, (R = ParamX) in {
flags coding=cp1251 ;
flags optimize=all_subs ;

View File

@@ -1,5 +1,7 @@
concrete ConjunctionBul of Conjunction =
CatBul ** open ResBul, Coordination, Prelude in {
flags coding=cp1251 ;
flags optimize=all_subs ;

View File

@@ -1,5 +1,7 @@
concrete ExtraBul of ExtraBulAbs = CatBul **
open ResBul, Coordination, Prelude in {
flags coding=cp1251 ;
lin
PossIndefPron p = {

View File

@@ -1,4 +1,6 @@
abstract ExtraBulAbs = Extra ** {
flags coding=cp1251 ;
fun
-- Feminine variants of pronouns (those in $Structural$ are

View File

@@ -15,6 +15,8 @@ concrete GrammarBul of Grammar =
StructuralBul,
IdiomBul
** {
flags coding=cp1251 ;
flags startcat = Phr ; unlexer = text ; lexer = text ;

View File

@@ -1,4 +1,6 @@
concrete IdiomBul of Idiom = CatBul ** open Prelude, ParadigmsBul, ResBul in {
flags coding=cp1251 ;
flags optimize=all_subs ;
lin

View File

@@ -4,6 +4,8 @@ concrete LangBul of Lang =
GrammarBul,
LexiconBul
** {
flags coding=cp1251 ;
flags startcat = Phr ; unlexer = text ; lexer = text ; erasing = on ; coding = cp1251 ;

View File

@@ -2,6 +2,8 @@
concrete LexiconBul of Lexicon = CatBul **
open ParadigmsBul, ResBul, Prelude in {
flags coding=cp1251 ;
flags
optimize=values ;

View File

@@ -12,7 +12,9 @@ resource MorphoBul = ResBul ** open
Predef,
Prelude,
CatBul
in {
in {
flags coding=cp1251 ;
flags optimize=all ;

View File

@@ -4,7 +4,9 @@ resource MorphoFunsBul = open
Prelude,
CatBul,
MorphoBul
in {
in {
flags coding=cp1251 ;
oper
--2 Adverbs

View File

@@ -1,4 +1,6 @@
concrete NounBul of Noun = CatBul ** open ResBul, Prelude in {
concrete NounBul of Noun = CatBul ** open ResBul, Prelude in {
flags coding=cp1251 ;
flags optimize=all_subs ;

View File

@@ -1,4 +1,6 @@
concrete NumeralBul of Numeral = CatBul ** open Prelude, ResBul in {
flags coding=cp1251 ;
lincat
Digit = {s : DForm => CardOrd => Str} ;

View File

@@ -3,7 +3,9 @@ resource ParadigmsBul = MorphoFunsBul ** open
Prelude,
MorphoBul,
CatBul
in {
in {
flags coding=cp1251 ;
oper
mkN001 : Str -> N ;
mkN001 base = let v0 = base

View File

@@ -1,4 +1,6 @@
concrete PhraseBul of Phrase = CatBul ** open Prelude, ResBul in {
flags coding=cp1251 ;
lin
PhrUtt pconj utt voc = {s = pconj.s ++ utt.s ++ voc.s} ;

View File

@@ -1,4 +1,6 @@
concrete QuestionBul of Question = CatBul ** open ResBul, Prelude in {
flags coding=cp1251 ;
flags optimize=all_subs ;

View File

@@ -1,4 +1,6 @@
concrete RelativeBul of Relative = CatBul ** open ResBul in {
flags coding=cp1251 ;
flags optimize=all_subs ;

View File

@@ -8,6 +8,8 @@
-- patterns needed for $Lex$.
resource ResBul = ParamX ** open Prelude in {
flags coding=cp1251 ;
flags optimize=all ;

View File

@@ -1,4 +1,6 @@
concrete SentenceBul of Sentence = CatBul ** open Prelude, ResBul in {
flags coding=cp1251 ;
flags optimize=all_subs ;

View File

@@ -1,5 +1,7 @@
concrete StructuralBul of Structural = CatBul **
open MorphoBul, ParadigmsBul, Prelude in {
flags coding=cp1251 ;
flags optimize=all ;

View File

@@ -1,4 +1,6 @@
concrete TextBul of Text = CatBul ** {
flags coding=cp1251 ;
-- This will work for almost all languages except Spanish.

View File

@@ -1,4 +1,6 @@
concrete VerbBul of Verb = CatBul ** open Prelude, ResBul, ParadigmsBul in {
flags coding=cp1251 ;
flags optimize=all_subs ;

View File

@@ -18,6 +18,6 @@ concrete DemoRus of Demo =
LexiconRus
** {
flags startcat = Phr ; unlexer = text ; lexer = text ;
flags startcat = Phr ; unlexer = text ; lexer = text ; coding = utf8 ;
} ;

View File

@@ -4,7 +4,7 @@ lin
-- Symbols, integers and floats used as proper names: the string is the
-- same for every value of the table parameter c, and gender is fixed
-- to neuter.
SymbPN i = {s = \\c => i.s ; g = Neutr} ; --- c
IntPN i = {s = \\c => i.s ; g = Neutr} ; --- c
FloatPN i = {s = \\c => i.s ; g = Neutr} ; --- c
-- A number used as a proper name: the neuter row of the number's table is
-- selected, and the gender of the result is fixed to neuter.
NumPN i = {s = i.s ! Neutr ; g = Neutr} ; --- c
CNIntNP cn i = {
s = \\c => cn.s ! Weak ! Sg ! Nom ++ i.s ;
@@ -17,14 +17,14 @@ lin
isPron = False
} ;
-- Noun phrase built from a common noun followed by a number.
-- For each value of c: the definite article (singular, in the noun's gender)
-- selected by c, then the noun's weak singular nominative form, then the
-- number in its neuter form selected by the same c.
-- Agreement is third person singular; the phrase is not a pronoun.
CNNumNP cn i = {
  s = \\c => artDef ! (GSg cn.g) ! c ++ cn.s ! Weak ! Sg ! Nom ++ i.s ! Neutr ! c ;
  a = agrP3 Sg ;
  isPron = False
  } ;
-- A symbol used as a sentence: the same string for every table argument.
SymbS sy = {s = \\_ => sy.s} ;
-- A symbol used as a number: the same string for both table arguments;
-- number is plural and the isNum field is set to True.
SymbNum n = {s = \\_,_ => n.s ; n = Pl ; isNum = True} ;
-- A symbol used as an ordinal: the symbol followed by a full stop.
SymbOrd n = {s = \\_ => n.s ++ "."} ;

View File

@@ -1,3 +1,3 @@
-- Concrete syntax for ExtraRusAbs, built on CatRus. The body defines no
-- rules; it only sets the coding flag to utf8.
concrete ExtraRus of ExtraRusAbs = CatRus ** {
flags coding=utf8 ;
}

View File

@@ -14,4 +14,4 @@ concrete GrammarRus of Grammar =
TextX,
StructuralRus,
IdiomRus
** { flags startcat = Phr ; unlexer = text ; lexer = text ;} ;
** { flags startcat = Phr ; unlexer = text ; lexer = text ; coding=utf8 ;} ;

View File

@@ -3,7 +3,7 @@
--
concrete IrregRus of IrregRusAbs = CatRus ** open ParadigmsRus in {
--
--flags optimize=values ;
flags optimize=values ; coding=utf8 ;
--
-- lin
-- awake_V = irregV "awake" "awoke" "awoken" ;

View File

@@ -2,7 +2,7 @@
concrete NounRus of Noun = CatRus ** open ResRus, Prelude, MorphoRus in {
flags optimize=all_subs ;
flags optimize=all_subs ; coding=utf8 ;
lin
DetCN kazhduj okhotnik = {

View File

@@ -2,6 +2,7 @@
concrete PhraseRus of Phrase = CatRus ** open Prelude, ResRus in {
flags coding=utf8 ;
lin
PhrUtt pconj utt voc = {s = pconj.s ++ utt.s ++ voc.s} ;

View File

@@ -2,7 +2,7 @@
concrete QuestionRus of Question = CatRus ** open ResRus, Prelude in {
flags optimize=all_subs ;
flags optimize=all_subs ; coding=utf8 ;
lin

View File

@@ -3,4 +3,4 @@
-- Top-level Russian concrete syntax: combines LangRus and ExtraRus and adds
-- no rules of its own. The module body only sets the coding flag to utf8.
concrete Russian of RussianAbs =
  LangRus,
  ExtraRus
  ** {flags coding=utf8 ;} ;