eSpeak NG is an open-source speech synthesizer that supports more than a hundred languages and accents.
You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

ta_rules 2.8KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248
  1. // This file is UTF8 encoded
  2. // Spelling to phoneme rules for Tamil
  3. // B means a combining vowel sign, or a virama
  4. .replace
  5. ௦ 0 // Tamil numbers: each Tamil digit on the left is replaced by the ASCII digit on the right
  6. ௧ 1
  7. ௨ 2
  8. ௩ 3
  9. ௪ 4
  10. ௫ 5
  11. ௬ 6
  12. ௭ 7
  13. ௮ 8
  14. ௯ 9
  15. ொ ொ // NOTE(review): both sides render the same here; presumably left is a multi-codepoint sequence and right the single vowel sign - confirm the bytes
  16. ோ ோ // same pattern for the long o sign
  17. ௌ ௌ // same pattern for the au sign
  18. .group 0xe0ae // characters which start with UTF-8 bytes: [e0 ae]
  19. ஂ // anusvara: this rule has no phoneme string
  20. ஃ // visarga: this rule has no phoneme string
  21. அ a // independent vowels: short/long pairs, long marked with ':'
  22. ஆ a:
  23. இ i
  24. ஈ i:
  25. உ u
  26. ஊ u:
  27. எ e
  28. _) எ ;e // add a short [j] sound at start of word ? ('_)' = start-of-word context, ';' prefixed to the vowel)
  29. ஏ e:
  30. _) ஏ ;e: // add a short [j] sound at start of word ?
  31. ஐ aI // diphthongs and o vowels
  32. ஒ o
  33. ஓ o:
  34. ஔ aU
  35. // consonants: a bare letter outputs consonant + V; with '(B' (vowel sign or virama follows) the V is omitted
  36. க gV // inter-vocalic, unless there is virama before or after
  37. க (B g // B follows, so no V is emitted
  38. க (் g // explicit virama follows
  39. ்) க gV // virama precedes
  40. ்) க (B g
  41. _) க kV // at start of word: k instead of g
  42. _) க (B k
  43. _) க (T gV // if word has $alt attribute in ta_list
  44. _) க (BT g // $alt
  45. க்க kkV // doubled letter (க + virama + க)
  46. க்க (B kk
  47. _) க (ௌ g // remaining rules: க given as g before these specific following letters
  48. க (ீத g
  49. க (ஜ gV
  50. _) க (ம்பீர gV
  51. _) க (ந்தர்வ gV
  52. _) க (ோவிந்த g
  53. ங NV // bare letter: consonant + V
  54. ங (B N // vowel sign or virama follows: consonant only
  55. ச sV // ?? [z]
  56. ச (B s
  57. _) ச sa // start of word. NOTE(review): uses 'a' where the other bare-letter rules use 'V' - confirm intended
  58. _) ச (B s
  59. ச்ச tS:V // doubled letter (ச + virama + ச)
  60. ச்ச (B tS:
  61. ற்ச tS: // NOTE(review): no V here, unlike the ச்ச rule above with the same context - confirm intended
  62. ற்ச (B tS:
  63. ட்) ச tSV // preceded by ட + virama
  64. ட்) ச (B tS
  65. ஞ்) ச dZV // preceded by ஞ + virama
  66. ஞ்) ச (B dZ
  67. ஜ dZV
  68. ஜ (B dZ
  69. ஞ n^V
  70. ஞ (B n^
  71. ட d.V // default (not at start of word): d.
  72. ட (B d.
  73. _) ட t.V // at start of word: t. instead of d.
  74. _) ட (B t.
  75. ட்ட t.t.V // doubled letter (ட + virama + ட)
  76. ட்ட (B t.t.
  77. ண n.V
  78. ண (B n.
  79. த dV // default (not at start of word): d
  80. த (B d
  81. _) த tV // at start of word: t instead of d
  82. _) த (B t
  83. _) த (T dV // if word has $alt attribute in ta_list
  84. _) த (BT d // if word has $alt
  85. த்த ttV // doubled letter (த + virama + த)
  86. த்த (B tt
  87. // exceptions, த as [d] at start of word before the listed letter sequences
  88. _) த (ன dV
  89. _) த (ர்ம dV
  90. _) த (ுர் d
  91. _) த (ூர d
  92. _) த (ெய்வ d
  93. _) த (ுஷ் d
  94. _) த (க்ஷிணா dV
  95. ந nV
  96. ந (B n // dental n
  97. ன nV // same phoneme output as ந
  98. ன (B n // alveolar n
  99. ப bV // default (not at start of word): b
  100. ப (B b
  101. _) ப pV // at start of word: p instead of b
  102. _) ப (B p
  103. _) ப (T bV // if word has $alt attribute in ta_list
  104. _) ப (BT b // if word has $alt
  105. ப்ப ppV // doubled letter (ப + virama + ப)
  106. ப்ப (B pp
  107. ட்) ப pV // preceded by ட + virama: p
  108. ட்) ப (B p
  109. ற்) ப pV // preceded by ற + virama: p
  110. ற்) ப (B p
  111. ஃ) ப fV // preceded by visarga (ஃ): f
  112. ஃ) ப (B f
  113. ம mV // from here each consonant has two rules: bare letter (with V) and '(B' form (without V)
  114. ம (B m
  115. ய jV
  116. ய (B j
  117. ர rV
  118. ர (B r
  119. ற RV
  120. ற (B R
  121. ற் (ற t. // RR -> t.R  (ற + virama, when another ற follows, gives t.)
  122. ல lV
  123. ல (B l
  124. ள l.V
  125. ள (B l.
  126. ழ z.V
  127. ழ (B z.
  128. வ vV
  129. வ (B v
  130. ஶ SV
  131. ஶ (B S
  132. ஷ s.V
  133. ஷ (B s.
  134. ஸ sV
  135. ஸ (B s
  136. ஹ hV
  137. ஹ (B h
  138. க்ஷ ks.V // cluster க + virama + ஷ
  139. க்ஷ (B ks.
  140. // combining vowels (only the signs in this [e0 ae] group; the rest are in group 0xe0af)
  141. ா a:
  142. ி i
  143. .group 0xe0af // characters which start with UTF-8 bytes: [e0 af]
  144. ீ i: // vowel signs: same phoneme strings as the matching independent vowels in group 0xe0ae
  145. ு u
  146. ூ u:
  147. ெ e
  148. ே e:
  149. ை aI
  150. ொ o
  151. ோ o:
  152. ௌ aU
  153. ் // virama: this rule has no phoneme string
  154. ௗ : // aU length mark: outputs only ':'
  155. .group 0xe0a4 // devanagari: characters which start with UTF-8 bytes [e0 a4]
  156. \340\244 _^_HI // switch to hindi voice (\340\244 is e0 a4 written as octal escapes)
  157. .group 0xe0a5 // devanagari: characters which start with UTF-8 bytes [e0 a5]
  158. \340\245 _^_HI // same switch for the e0 a5 lead bytes
  159. .group
  160. ் // virama: no phoneme string (same rule also appears in group 0xe0af)
  161. $ dolV // dollar sign
  162. D) . (D+ _pul.l.i // '.' with D on both sides; presumably D = digit, i.e. a decimal point - confirm against the rule-syntax docs