mirror of
https://github.com/GrammaticalFramework/gf-core.git
synced 2026-04-23 11:42:49 -06:00
pronunciation variant of LangThai (still buggy)
This commit is contained in:
@@ -18,7 +18,7 @@ lin
|
|||||||
-- bank_N = regN "bank" ;
|
-- bank_N = regN "bank" ;
|
||||||
-- beautiful_A = regADeg "beautiful" ;
|
-- beautiful_A = regADeg "beautiful" ;
|
||||||
-- become_VA = mkVA (irregV "become" "became" "become") ;
|
-- become_VA = mkVA (irregV "become" "became" "become") ;
|
||||||
-- beer_N = regN "beer" ;
|
beer_N = mkN biar_s kew_s ;
|
||||||
-- beg_V2V = mkV2V (regDuplV "beg") noPrep toP ;
|
-- beg_V2V = mkV2V (regDuplV "beg") noPrep toP ;
|
||||||
big_A = ss yay_s ;
|
big_A = ss yay_s ;
|
||||||
-- bike_N = regN "bike" ;
|
-- bike_N = regN "bike" ;
|
||||||
@@ -64,7 +64,7 @@ lin
|
|||||||
-- doctor_N = regN "doctor" ;
|
-- doctor_N = regN "doctor" ;
|
||||||
-- dog_N = regN "dog" ;
|
-- dog_N = regN "dog" ;
|
||||||
-- door_N = regN "door" ;
|
-- door_N = regN "door" ;
|
||||||
-- drink_V2 = dirV2 (irregV "drink" "drank" "drunk") ;
|
drink_V2 = dirV2 (regV dvm_s) ;
|
||||||
-- easy_A2V = mkA2V (regA "easy") forP ;
|
-- easy_A2V = mkA2V (regA "easy") forP ;
|
||||||
-- eat_V2 = dirV2 (irregV "eat" "ate" "eaten") ;
|
-- eat_V2 = dirV2 (irregV "eat" "ate" "eaten") ;
|
||||||
-- empty_A = regADeg "empty" ;
|
-- empty_A = regADeg "empty" ;
|
||||||
@@ -206,7 +206,7 @@ lin
|
|||||||
-- window_N = regN "window" ;
|
-- window_N = regN "window" ;
|
||||||
-- wine_N = regN "wine" ;
|
-- wine_N = regN "wine" ;
|
||||||
-- win_V2 = dirV2 (irregDuplV "win" "won" "won") ;
|
-- win_V2 = dirV2 (irregDuplV "win" "won" "won") ;
|
||||||
woman_N = mkN yig_s khon_s ;
|
woman_N = mkN (puu_s ++ yig_s) khon_s ;
|
||||||
-- wonder_VQ = mkVQ (regV "wonder") ;
|
-- wonder_VQ = mkVQ (regV "wonder") ;
|
||||||
-- wood_N = regN "wood" ;
|
-- wood_N = regN "wood" ;
|
||||||
-- write_V2 = dirV2 (irregV "write" "wrote" "written") ;
|
-- write_V2 = dirV2 (irregV "write" "wrote" "written") ;
|
||||||
|
|||||||
@@ -1,2 +1,4 @@
|
|||||||
strings:
|
strings:
|
||||||
runghc -i../../../src FileThai.hs StringsThai.gf >StringsTha.gf
|
runghc -i../../../src FileThai.hs StringsThai.gf >StringsTha.gf
|
||||||
|
pronstrings:
|
||||||
|
runghc -i../../../src FileThai.hs -p StringsThai.gf >pronunciation/StringsTha.gf
|
||||||
|
|||||||
@@ -30,7 +30,7 @@ concrete NounTha of Noun = CatTha ** open StringsTha, ResTha, Prelude in {
|
|||||||
hasC = quant.hasC ;
|
hasC = quant.hasC ;
|
||||||
} ;
|
} ;
|
||||||
DetPl quant num ord = {
|
DetPl quant num ord = {
|
||||||
s1 = [] ;
|
s1 = num.s ;
|
||||||
s2 = quant.s ++ ord.s ;
|
s2 = quant.s ++ ord.s ;
|
||||||
hasC = orB num.hasC quant.hasC ;
|
hasC = orB num.hasC quant.hasC ;
|
||||||
} ;
|
} ;
|
||||||
@@ -59,8 +59,8 @@ concrete NounTha of Noun = CatTha ** open StringsTha, ResTha, Prelude in {
|
|||||||
DefArt = {s = [] ; hasC = False} ;
|
DefArt = {s = [] ; hasC = False} ;
|
||||||
IndefArt = {s = [] ; hasC = False} ;
|
IndefArt = {s = [] ; hasC = False} ;
|
||||||
|
|
||||||
-- MassDet = {s = [] ; n = Sg} ;
|
MassDet = {s = [] ; hasC = False} ;
|
||||||
--
|
|
||||||
UseN n = n ;
|
UseN n = n ;
|
||||||
-- UseN2 n = n ;
|
-- UseN2 n = n ;
|
||||||
-- UseN3 n = n ;
|
-- UseN3 n = n ;
|
||||||
|
|||||||
@@ -9,22 +9,17 @@ Literal strings are defined as constants, all in the generated file
|
|||||||
|
|
||||||
StringsTha.gf
|
StringsTha.gf
|
||||||
|
|
||||||
This file is obtained from
|
This file is obtained by 'make strings' from
|
||||||
|
|
||||||
StringsThai.gf
|
StringsThai.gf
|
||||||
|
|
||||||
by
|
using the transliteration defined in GF/src/GF/Text/Thai.hs
|
||||||
|
and documented in thai.html.
|
||||||
make strings
|
|
||||||
|
|
||||||
using the transliteration defined in
|
|
||||||
|
|
||||||
GF/src/GF/Text/Thai.hs
|
|
||||||
|
|
||||||
and documented in
|
|
||||||
|
|
||||||
thai.html
|
|
||||||
|
|
||||||
From this, also approximate pronunciation can be derived.
|
From this, also approximate pronunciation can be derived.
|
||||||
We also plan to use this unique word list for segmenting
|
Use then the command 'make pronstrings' and the main file
|
||||||
|
|
||||||
|
LangThaiPron.gf
|
||||||
|
|
||||||
|
We also plan to use the unique word list for segmenting
|
||||||
Thai strings.
|
Thai strings.
|
||||||
|
|||||||
@@ -7,15 +7,18 @@ resource StringsTha = {
|
|||||||
oper
|
oper
|
||||||
|
|
||||||
baan_s = "บ้าน" ; -- house
|
baan_s = "บ้าน" ; -- house
|
||||||
|
biar_s = "เบีอร์" ;
|
||||||
ca_s = "จะ" ; -- Modal
|
ca_s = "จะ" ; -- Modal
|
||||||
cet_s = "เจ็ด" ; -- seven
|
cet_s = "เจ็ด" ; -- seven
|
||||||
chan_s = "ฉัน" ; -- I
|
chan_s = "ฉัน" ; -- I
|
||||||
chay_s = "ไช่" ; -- be-not
|
chay_s = "ไช่" ; -- be-not
|
||||||
|
dvm_s = "ดึม" ; -- drink
|
||||||
et_s = "เอ็ด" ; -- one'
|
et_s = "เอ็ด" ; -- one'
|
||||||
haa_s = "ห้า" ; -- five
|
haa_s = "ห้า" ; -- five
|
||||||
hay_s = "ให้" ; -- give
|
hay_s = "ให้" ; -- give
|
||||||
hok_s = "หก" ; -- six
|
hok_s = "หก" ; -- six
|
||||||
kaaw_s = "เกา" ; -- nine
|
kaaw_s = "เกา" ; -- nine
|
||||||
|
kew_s = "แก้ว" ; -- glass (drink Classif)
|
||||||
khaw_s = "เขว" ; -- he
|
khaw_s = "เขว" ; -- he
|
||||||
khon_s = "คน" ; -- people Classif
|
khon_s = "คน" ; -- people Classif
|
||||||
khoog_s = "ของ" ; -- Possessive
|
khoog_s = "ของ" ; -- Possessive
|
||||||
|
|||||||
@@ -7,15 +7,18 @@ resource StringsTha = {
|
|||||||
oper
|
oper
|
||||||
|
|
||||||
baan_s = "bT2a:n" ; -- house
|
baan_s = "bT2a:n" ; -- house
|
||||||
|
biar_s = "ebi:OrK" ;
|
||||||
ca_s = "ca." ; -- Modal
|
ca_s = "ca." ; -- Modal
|
||||||
cet_s = "ecSd" ; -- seven
|
cet_s = "ecSd" ; -- seven
|
||||||
chan_s = "c1an" ; -- I
|
chan_s = "c1an" ; -- I
|
||||||
chay_s = "a&c2T1" ; -- be-not
|
chay_s = "a&c2T1" ; -- be-not
|
||||||
|
dvm_s = "dvm" ; -- drink
|
||||||
et_s = "eOSd" ; -- one'
|
et_s = "eOSd" ; -- one'
|
||||||
haa_s = "hT2a:" ; -- five
|
haa_s = "hT2a:" ; -- five
|
||||||
hay_s = "a%hT2" ; -- give
|
hay_s = "a%hT2" ; -- give
|
||||||
hok_s = "ho?k" ; -- six
|
hok_s = "ho?k" ; -- six
|
||||||
kaaw_s = "eka:" ; -- nine
|
kaaw_s = "eka:" ; -- nine
|
||||||
|
kew_s = "e'kT2w" ; -- glass (drink Classif)
|
||||||
khaw_s = "ek1w" ; -- he
|
khaw_s = "ek1w" ; -- he
|
||||||
khon_s = "k2n" ; -- people Classif
|
khon_s = "k2n" ; -- people Classif
|
||||||
khoog_s = "k1Og" ; -- Possessive
|
khoog_s = "k1Og" ; -- Possessive
|
||||||
|
|||||||
62
lib/resource-1.0/thai/pronunciation/StringsTha.gf
Normal file
62
lib/resource-1.0/thai/pronunciation/StringsTha.gf
Normal file
@@ -0,0 +1,62 @@
|
|||||||
|
-- The only place where literal Thai strings are defined
|
||||||
|
-- (except for Lexicon and Structural).
|
||||||
|
-- Convert this into StringsThai by 'make strings'
|
||||||
|
|
||||||
|
resource StringsTha = {
|
||||||
|
|
||||||
|
oper
|
||||||
|
|
||||||
|
baan_s = "b^aan" ; -- house
|
||||||
|
biar_s = "b-eiiO" ;
|
||||||
|
ca_s = "c`a" ; -- Modal
|
||||||
|
cet_s = "c`et" ; -- seven
|
||||||
|
chan_s = "ch~an" ; -- I
|
||||||
|
chay_s = "ch^ay" ; -- be-not
|
||||||
|
dvm_s = "d-vm" ; -- drink
|
||||||
|
et_s = "O`et" ; -- one'
|
||||||
|
haa_s = "h^aa" ; -- five
|
||||||
|
hay_s = "h^ay" ; -- give
|
||||||
|
hok_s = "k`o" ; -- six
|
||||||
|
kaaw_s = "k-eaa" ; -- nine
|
||||||
|
kew_s = "k^äw" ; -- glass (drink Classif)
|
||||||
|
khaw_s = "kh`ew" ; -- he
|
||||||
|
khon_s = "kh-on" ; -- people Classif
|
||||||
|
khoog_s = "kh~Og" ; -- Possessive
|
||||||
|
khun_s = "kh-un" ; -- you
|
||||||
|
lag_s = "l~ag" ; -- houses Classif
|
||||||
|
lap_s = "l`ap" ; -- sleep2
|
||||||
|
lem_s = "l^em" ; -- books Classif
|
||||||
|
may_s = "m-ay" ; -- not
|
||||||
|
m'ay_s = "m~ay" ; -- Question
|
||||||
|
mvvn_s = "m`vvn" ; -- ten thousand
|
||||||
|
nag_s = "n~ag" ; -- book1
|
||||||
|
nan_s = "n~an" ; -- that
|
||||||
|
noon_s = "n-On" ; -- sleep1
|
||||||
|
nvg_s = "n~vg" ; -- one
|
||||||
|
pay_s = "p-ay" ; -- go
|
||||||
|
peet_s = "p`ät" ; -- eight
|
||||||
|
pen_s = "p-en" ; -- be, can-know
|
||||||
|
phan_s = "ph-an" ; -- thousand
|
||||||
|
puu_s = "ph^uu" ; -- woman1
|
||||||
|
rak_s = "r'ak" ; -- love
|
||||||
|
raw_s = "r-eaa" ; -- we
|
||||||
|
rooy_s = "r~Oy" ; -- hundred
|
||||||
|
saam_s = "s~aam" ; -- three
|
||||||
|
seen_s = "s~än" ; -- hundred thousand
|
||||||
|
si_s = "s'i" ; -- Imperative
|
||||||
|
sii_s = "s`ii" ; -- four
|
||||||
|
sip_s = "s`ip" ; -- ten
|
||||||
|
soog_s = "s~Og" ; -- two
|
||||||
|
svv_s = "s~vvO" ; -- book2
|
||||||
|
thii_s = "th^ii" ; -- Ord
|
||||||
|
tog_s = "t^Og" ; -- must
|
||||||
|
waa_s = "w^aa" ; -- that Conj
|
||||||
|
way_s = "w~ay" ; -- can-potent
|
||||||
|
yaa_s = "O`aay" ; -- Neg Imper
|
||||||
|
yaak_s = "O`aayk" ; -- want
|
||||||
|
yay_s = "y~ay" ; -- big
|
||||||
|
yig_s = "y~ig" ; -- woman2
|
||||||
|
yii_s = "y^ii" ; -- two'
|
||||||
|
|
||||||
|
|
||||||
|
}
|
||||||
Reference in New Issue
Block a user