eSpeak NG is an open source speech synthesizer that supports more than a hundred languages and accents.
You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

ta_rules 1.8KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185
  1. // This file is UTF8 encoded
  2. // Spelling to phoneme rules for Tamil
  3. // B means a combining vowel sign, or a virama
  4. .replace // substitution table: left column is the source character, right column its replacement
  5. ௦ 0 // Tamil numbers: each Tamil digit is replaced by the ASCII digit of the same value
  6. ௧ 1
  7. ௨ 2
  8. ௩ 3
  9. ௪ 4
  10. ௫ 5
  11. ௬ 6
  12. ௭ 7
  13. ௮ 8
  14. ௯ 9
  15. .
  16. .group 0xe0ae // characters which start with UTF-8 bytes: [e0 ae]
  17. ஂ // anusvara (no phoneme output)
  18. ஃ // visarga (no phoneme output)
  19. அ a // independent vowels; ':' marks the long member of each short/long pair
  20. ஆ a:
  21. இ i
  22. ஈ i:
  23. உ u
  24. ஊ u:
  25. எ e
  26. ஏ e: // long e, a single length mark like the other long vowels and the combining sign ே
  27. ஐ E:
  28. ஒ o
  29. ஓ o:
  30. ஔ aU
  31. // consonants: a bare consonant emits its phoneme plus the inherent vowel V; when a combining sign or virama (B) follows, only the consonant phoneme is emitted
  32. க gV // inter-vocalic, unless there is virama before or after
  33. க (B g
  34. க (் g
  35. ்) க gV
  36. ்) க (B g
  37. _) க kV // "_)" pre-context: voiceless form at the start of a word
  38. _) க (B k
  39. க்க kkV // doubled consonant (consonant + virama + consonant)
  40. க்க (B kk
  41. ங NV
  42. ங (B N
  43. ச dZV
  44. ச (B dZ
  45. _) ச sV // word-initial: s plus inherent vowel V, like every other bare-consonant rule
  46. _) ச (B s
  47. ச்ச tS:V
  48. ச்ச (B tS:
  49. ஜ dZV
  50. ஜ (B dZ
  51. ஞ n^V
  52. ஞ (B n^
  53. ட d.V
  54. ட (B d.
  55. _) ட t.V
  56. _) ட (B t.
  57. ட்ட t.t.V
  58. ட்ட (B t.t.
  59. ண n.V
  60. ண (B n.
  61. த dV
  62. த (B d
  63. _) த tV
  64. _) த (B t
  65. த்த ttV
  66. த்த (B tt
  67. ந nV
  68. ந (B n // dental n
  69. ன nV
  70. ன (B n // alveolar n
  71. ப bV
  72. ப (B b
  73. _) ப pV
  74. _) ப (B p
  75. ப்ப ppV
  76. ப்ப (B pp
  77. ஃ) ப fV // visarga before ப gives f
  78. ஃ) ப (B f
  79. ம mV
  80. ம (B m
  81. ய jV
  82. ய (B j
  83. ர rV
  84. ர (B r
  85. ற RV
  86. ற (B R
  87. ற் (ற t. // RR -> t.R
  88. ல lV
  89. ல (B l
  90. ள l.V
  91. ள (B l.
  92. ழ z.V
  93. ழ (B z.
  94. வ vV
  95. வ (B v
  96. ஶ SV
  97. ஶ (B S
  98. ஷ s.V
  99. ஷ (B s.
  100. ஸ sV
  101. ஸ (B s
  102. ஹ hV
  103. ஹ (B h
  104. // combining vowels: the two vowel signs still listed under .group 0xe0ae; the remaining signs are listed under .group 0xe0af
  105. ா a:
  106. ி i
  107. .group 0xe0af // characters which start with UTF-8 bytes: [e0 af]
  108. ீ i: // remaining combining vowel signs; ':' marks the long vowels
  109. ு u
  110. ூ u:
  111. ெ e
  112. ே e:
  113. ை E:
  114. ொ o
  115. ோ o:
  116. ௌ aU
  117. ் // virama (no phoneme output)
  118. ௗ : // aU length mark
  119. .group 0xe0a4 // devanagari
  120. \340\244 _^_HI // switch to hindi voice (octal \340\244 = bytes e0 a4)
  121. .group 0xe0a5 // devanagari
  122. \340\245 _^_HI // switch to hindi voice (octal \340\245 = bytes e0 a5)
  123. .group // group declared without a name or byte prefix
  124. ் // virama (no phoneme output)
  125. $ dolV // dollar sign is spoken as the phonemes "dolV"