eSpeak NG is an open source speech synthesizer that supports more than hundred languages and accents.
You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

smj_rules 7.8KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282
  1. // SMJ translation rules
  2. // This file is UTF-8 encoded
  3. // _) a // "a" at the start of a word
  4. // a (CC // "a" followed by two consonants
  5. // a (C% // "a" followed by a double consonant (the same letter twice)
  6. // a (/% // "a" followed by a percent sign
  7. // %C) a // "a" preceded by a double consonants
  8. // @@) bi // "bi" preceded by at least two syllables
  9. // @@a) bi // "bi" preceded by at least 2 syllables and following 'a'
  10. // START SMJ HERE
  11. // groups
  12. //.L01 i j // used in palatalization rules
  13. .L01 b d g k p t // Plosives
  14. .L02 r l j v // Sonorants
  15. //.L02 b d f g h j l m n r s v
  16. //.L03 l m n r
  17. //.L04 a b c d e f g h i j k l m n o p q r s t u v õ ä ö ü
  18. //.L05 a e i l m n o r u õ ä ö ü
  19. // Epenthetic vowels in Q3 consonant clusters
  20. // r l j v followed by homorganic consonants (geminates)
  21. // barggo, dárbbo, tjoarvve, girjje, álggo, galbba, gålmmå, dálvve, nijbbe, bievdde
  22. // separate rules for all cons. clusters and vowel nucleai?
  23. // a (L02%C // possible to generalize?
  24. // A) rgg r@^g // Any vowel + schwaa - more general?
  25. //Orthographically homonymous Q3: f, l, m, n, nj, ń, ñ, ŋ, r, s, sj, v
  26. // After numeral 1 -- Q3; after any numeral <1 -- Q2?
  27. // akta @) ff ff:
  28. // Word order? -- Impossible to have a syntactic disambiguator in Espeak to recognize homonymous sg.nom & sg.gen forms...
  29. // OR if adjusted orthography would be used, e.g.: f'f/fff ff:
  30. // Vowel compensation/readjustment: V1 and V2 longest in Q1, gradually decreasing in length, but differences very small/not significant.
  31. .group a
  32. // a A
  33. a (@ A // back vowel
  34. @) a a:
  35. artihkal ar.t'ihkAl
  36. %CC) a A // short after Q3 consonant/cluster
  37. .group á
  38. %CC) á a // short after Q3 consonant/cluster
  39. á (@ A: //
  40. @) á a: // in 2nd syll
  41. C) á A: // after Q1 (single) consonant
  42. .group ä
  43. ä (@ &
  44. ä &: //
  45. // ä i& // in Sweden
  46. ä e& // in Sweden
  47. .group æ // same as ä
  48. æ (@ &
  49. æ &: //
  50. // æ i& // in Sweden
  51. æ e& // in Sweden
  52. %CC) æ & // short after Q3 consonant/cluster
  53. .group å
  54. å O
  55. @) å O: // in 2nd syll
  56. %CC) å O // short after Q3 consonant/cluster
  57. .group b
  58. b p
  59. A) b (A b // voiced in an intervocalic position
  60. bb b: // voiced within a geminate
  61. bussa p'u-s:A // Scandinavian loanword
  62. .group c
  63. c ts
  64. .group d
  65. d t
  66. dal dAl
  67. A) d (A d // voiced in an intervocalic position
  68. dd d:
  69. dj c // palatal plosive
  70. A) dj (A J\ // voiced palatal plosive between vowels
  71. A) ddj (A J\: // voiced palatal plosive between vowels
  72. dts dz // [d͡z]
  73. dtj dZ // [d͡ʒ]
  74. .group e
  75. e (@ E: // open-mid
  76. e (_ iE // open 2nd syll
  77. @) e iE // in 2nd syll
  78. e E // other environments
  79. .group f
  80. f f
  81. ff f:
  82. // akta @) ff (A ff: // (Q3/sg.nom when with numeral 1)
  83. .group g
  84. g k
  85. A) g (A g // voiced in an intervocalic position
  86. gg g:
  87. .group h
  88. h h
  89. hk hk
  90. hkk k: // [h] not audible in Q3 cons. cluster
  91. hp hp
  92. hpp p: // [h] not audible in Q3 cons. cluster
  93. ht ht
  94. htt t: // [h] not audible in Q3 cons. cluster
  95. hts hts
  96. htts h:ts
  97. htj htS
  98. httj ht:S
  99. .group i
  100. i i: // can be long as well?
  101. ie (@ iE
  102. %CC) i i // short after Q3 consonant
  103. .group j
  104. j j
  105. ja ja
  106. i) jbb jIb
  107. journalissta Sur.nal'isstA
  108. .group k
  109. k k
  110. k (á kh // Aspirated in Scandinavian loanwords, like this?
  111. káffa kh'A:f:A
  112. kásus kh'A:su-s
  113. kássa kh'A:S:A
  114. kk k:
  115. .group l
  116. l l // Can be a copula itself
  117. ll l:
  118. // akta @) ll (A ll: // (Q3/sg.nom when with numeral 1)
  119. á) lgg lAg // Q3
  120. a) lbb lab // Q3
  121. u) lpp lub // Q3
  122. á) lmm lAm // Q3
  123. á) lvv lAv // Q3
  124. .group m
  125. m m
  126. mm m:
  127. // akta @) mm (A mm: // (Q3/sg.nom when with numeral 1)
  128. .group n
  129. n n
  130. nj n_j
  131. nnj n_j:
  132. // akta @) nnj (A nn_j: // (Q3/sg.nom when with numeral 1)
  133. .group ñ
  134. ñ N
  135. ññ N:
  136. // akta @) ññ (A NN: // (Q3/sg.nom when with numeral 1)
  137. .group ń
  138. ń N
  139. ńń N:
  140. // akta @) ńń (A NN: // (Q3/sg.nom when with numeral 1)
  141. .group ŋ
  142. ŋ N
  143. ŋŋ N:
  144. // akta @) ŋŋ (A NN: // (Q3/sg.nom when with numeral 1)
  145. .group o
  146. o oO
  147. @) o uo
  148. oa ua //
  149. oa (@ oA //
  150. .group ö
  151. %CC) ö Y
  152. ö Y: //
  153. .group ø
  154. %CC) ø Y
  155. ø Y: //
  156. .group p
  157. p p
  158. p (á ph // Aspirated in Scandinavian loanwords
  159. pp p:
  160. parlamænnta par.lAm'&ntA
  161. .group r
  162. r r
  163. rd rt
  164. rl rl
  165. // rl l. // Retroflex. in Scandinavian loanwords
  166. rn rn
  167. // rn n. // Retroflex. in Scandinavian loanwords
  168. rt rt
  169. // rt t. // Retroflex. in Scandinavian loanwords
  170. a) rgg rag // Q3
  171. e) rgg reg // Q3
  172. æ) rgg r&g // Q3
  173. a) rvv rav // Q3
  174. á) rbb rAb // Q3
  175. i) rjj rij // Q3
  176. u) rŋŋ ruN // Q3
  177. rr r:
  178. // akta @) rr (A rr: // (Q3/sg.nom when with numeral 1)
  179. .group s
  180. s s
  181. ss s:
  182. // akta @) ss (A ss: // (Q3/sg.nom when with numeral 1)
  183. sj S
  184. ssj S: // Q2 or Q3
  185. // akta @) ssj (A SS: // (Q3/sg.nom when with numeral 1)
  186. .group t
  187. t t
  188. t (á th // Aspirated in Scandinavian loanwords
  189. t (_ ht // at the end of a word
  190. tt t:
  191. tj tS // voiceless alveo-palatal fricative in Sweden
  192. ts ts // voiceless alveo-palatal fricative in Sweden e.g. <subtsas>
  193. tts ts:
  194. .group u
  195. u u
  196. uo (@ uo
  197. // u u: //
  198. // u U- //
  199. // u u- // in newish Scand. loanwords like <komuvnna>
  200. // List some of most common scand. loanwords?
  201. .group v
  202. v v
  203. vv v:
  204. L01) v f // before a plosive
  205. v (_ P // in the end of a word, e.g. 1sg suffix
  206. e) vdd ved // Q3
  207. i) vdd vid // Q3
  208. å) vdd vOd // Q3
  209. // akta @) vv (A vv: // (Q3/sg.nom when with numeral 1)
  210. .group w
  211. w v
  212. .group x
  213. x ks
  214. xx k:s
  215. .group y
  216. y y
  217. .group z
  218. z ts
  219. zz t:s // pizza
  220. K) zh Z