eSpeak NG is an open source speech synthesizer that supports more than hundred languages and accents.
You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

voice.h 3.4KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081
  1. /***************************************************************************
  2. * Copyright (C) 2005 to 2007 by Jonathan Duddington *
  3. * email: [email protected] *
  4. * *
  5. * This program is free software; you can redistribute it and/or modify *
  6. * it under the terms of the GNU General Public License as published by *
  7. * the Free Software Foundation; either version 3 of the License, or *
  8. * (at your option) any later version. *
  9. * *
  10. * This program is distributed in the hope that it will be useful, *
  11. * but WITHOUT ANY WARRANTY; without even the implied warranty of *
  12. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the *
  13. * GNU General Public License for more details. *
  14. * *
  15. * You should have received a copy of the GNU General Public License *
  16. * along with this program; if not, write see: *
  17. * <http://www.gnu.org/licenses/>. *
  18. ***************************************************************************/
  19. typedef struct {
  20. char v_name[40];
  21. int phoneme_tab_ix; // phoneme table number
  22. int pitch_base; // Hz<<12
  23. int pitch_range; // standard = 0x1000
  24. int speedf1;
  25. int speedf2;
  26. int speedf3;
  27. int flutter;
  28. int roughness;
  29. int echo_delay;
  30. int echo_amp;
  31. int n_harmonic_peaks; // highest formant which is formed from adding harmonics
  32. int peak_shape; // alternative shape for formant peaks (0=standard 1=squarer)
  33. int voicing; // 100% = 64, level of formant-synthesized sound
  34. int formant_factor; // adjust nominal formant frequencies by this because of the voice's pitch (256ths)
  35. int consonant_amp; // amplitude of unvoiced consonants
  36. int consonant_ampv; // amplitude of the noise component of voiced consonants
  37. int klatt[8];
  38. // parameters used by Wavegen
  39. short freq[N_PEAKS]; // 100% = 256
  40. short height[N_PEAKS]; // 100% = 256
  41. short width[N_PEAKS]; // 100% = 256
  42. short freqadd[N_PEAKS]; // Hz
  43. // copies without temporary adjustments from embedded commands
  44. short freq2[N_PEAKS]; // 100% = 256
  45. short height2[N_PEAKS]; // 100% = 256
  46. short width2[N_PEAKS]; // 100% = 256
  47. int breath[N_PEAKS]; // amount of breath for each formant. breath[0] indicates whether any are set.
  48. int breathw[N_PEAKS]; // width of each breath formant
  49. // This table provides the opportunity for tone control.
  50. // Adjustment of harmonic amplitudes, steps of 8Hz
  51. // value of 128 means no change
  52. #define N_TONE_ADJUST 1000
  53. unsigned char tone_adjust[N_TONE_ADJUST]; // 8Hz steps * 1000 = 8kHz
  54. } voice_t;
  55. // percentages shown to user, ix=N_PEAKS means ALL peaks
  56. extern USHORT voice_pcnt[N_PEAKS+1][3];
  57. extern voice_t *voice;
  58. extern int tone_points[12];
  59. const char *SelectVoice(espeak_VOICE *voice_select);
  60. espeak_VOICE *SelectVoiceByName(espeak_VOICE **voices, const char *name);
  61. voice_t *LoadVoice(const char *voice_name, int control);
  62. voice_t *LoadVoiceVariant(const char *voice_name, int variant);
  63. void DoVoiceChange(voice_t *v);
  64. void WavegenSetVoice(voice_t *v);
  65. void ReadTonePoints(char *string, int *tone_pts);