| @@ -17,8 +17,10 @@ | |||
| #include "config.h" | |||
| #include <string.h> | |||
| #include <stdint.h> | |||
| #include <stdlib.h> | |||
| #include <wchar.h> | |||
| #include <espeak-ng/espeak_ng.h> | |||
| @@ -684,6 +686,8 @@ text_decoder_decode_string(espeak_ng_TEXT_DECODER *decoder, | |||
| if (enc->get == NULL) | |||
| return ENS_UNKNOWN_TEXT_ENCODING; | |||
| if (length < 0) length = string ? strlen(string) + 1 : 0; | |||
| decoder->get = string ? enc->get : null_decoder_getc; | |||
| decoder->codepage = enc->codepage; | |||
| decoder->current = (const uint8_t *)string; | |||
| @@ -704,6 +708,8 @@ text_decoder_decode_string_auto(espeak_ng_TEXT_DECODER *decoder, | |||
| if (enc->get == NULL) | |||
| return ENS_UNKNOWN_TEXT_ENCODING; | |||
| if (length < 0) length = string ? strlen(string) + 1 : 0; | |||
| decoder->get = string ? string_decoder_getc_auto : null_decoder_getc; | |||
| decoder->codepage = enc->codepage; | |||
| decoder->current = (const uint8_t *)string; | |||
| @@ -716,6 +722,8 @@ text_decoder_decode_wstring(espeak_ng_TEXT_DECODER *decoder, | |||
| const wchar_t *string, | |||
| int length) | |||
| { | |||
| if (length < 0) length = string ? wcslen(string) + 1 : 0; | |||
| decoder->get = string ? string_decoder_getc_wchar : null_decoder_getc; | |||
| decoder->codepage = NULL; | |||
| decoder->current = (const uint8_t *)string; | |||
| @@ -1,7 +1,7 @@ | |||
| /* | |||
| * Copyright (C) 2005 to 2015 by Jonathan Duddington | |||
| * email: [email protected] | |||
| * Copyright (C) 2015-2016 Reece H. Dunn | |||
| * Copyright (C) 2015-2017 Reece H. Dunn | |||
| * | |||
| * This program is free software; you can redistribute it and/or modify | |||
| * it under the terms of the GNU General Public License as published by | |||
| @@ -1,7 +1,7 @@ | |||
| /* | |||
| * Copyright (C) 2005 to 2014 by Jonathan Duddington | |||
| * email: [email protected] | |||
| * Copyright (C) 2015-2016 Reece H. Dunn | |||
| * Copyright (C) 2015-2017 Reece H. Dunn | |||
| * | |||
| * This program is free software; you can redistribute it and/or modify | |||
| * it under the terms of the GNU General Public License as published by | |||
| @@ -1916,21 +1916,6 @@ int UpperCaseInWord(Translator *tr, char *word, int c) | |||
| return 0; | |||
| } | |||
| static inline espeak_ng_STATUS init_wstring_decoder(const wchar_t *text) | |||
| { | |||
| return text_decoder_decode_wstring(p_decoder, text, wcslen(text) + 1); | |||
| } | |||
| static inline espeak_ng_STATUS init_string_decoder(const char *text, espeak_ng_ENCODING encoding) | |||
| { | |||
| return text_decoder_decode_string(p_decoder, text, strlen(text) + 1, encoding); | |||
| } | |||
| static inline espeak_ng_STATUS init_string_decoder_auto(const char *text, espeak_ng_ENCODING encoding) | |||
| { | |||
| return text_decoder_decode_string_auto(p_decoder, text, strlen(text) + 1, encoding); | |||
| } | |||
| const void *TranslateClause(Translator *tr, const void *vp_input, int *tone_out, char **voice_change) | |||
| { | |||
| int ix; | |||
| @@ -1988,19 +1973,19 @@ const void *TranslateClause(Translator *tr, const void *vp_input, int *tone_out, | |||
| switch (option_multibyte) | |||
| { | |||
| case espeakCHARS_WCHAR: | |||
| init_wstring_decoder((const wchar_t *)vp_input); | |||
| text_decoder_decode_wstring(p_decoder, (const wchar_t *)vp_input, -1); | |||
| break; | |||
| case espeakCHARS_AUTO: | |||
| init_string_decoder_auto((const char *)vp_input, tr->encoding); | |||
| text_decoder_decode_string_auto(p_decoder, (const char *)vp_input, -1, tr->encoding); | |||
| break; | |||
| case espeakCHARS_UTF8: | |||
| init_string_decoder((const char *)vp_input, ESPEAKNG_ENCODING_UTF_8); | |||
| text_decoder_decode_string(p_decoder, (const char *)vp_input, -1, ESPEAKNG_ENCODING_UTF_8); | |||
| break; | |||
| case espeakCHARS_8BIT: | |||
| init_string_decoder((const char *)vp_input, tr->encoding); | |||
| text_decoder_decode_string(p_decoder, (const char *)vp_input, -1, tr->encoding); | |||
| break; | |||
| case espeakCHARS_16BIT: | |||
| init_string_decoder((const char *)vp_input, ESPEAKNG_ENCODING_ISO_10646_UCS_2); | |||
| text_decoder_decode_string(p_decoder, (const char *)vp_input, -1, ESPEAKNG_ENCODING_ISO_10646_UCS_2); | |||
| break; | |||
| default: | |||
| return NULL; // unknown multibyte option value | |||
| @@ -736,11 +736,21 @@ test_char_decoder() | |||
| espeak_ng_TEXT_DECODER *decoder = create_text_decoder(); | |||
| // null string | |||
| assert(text_decoder_decode_string(decoder, NULL, 5, ESPEAKNG_ENCODING_ISO_8859_1) == ENS_OK); | |||
| assert(text_decoder_decode_string(decoder, NULL, -1, ESPEAKNG_ENCODING_ISO_8859_1) == ENS_OK); | |||
| assert(text_decoder_eof(decoder) == 1); | |||
| assert(text_decoder_getc(decoder) == 0); | |||
| assert(text_decoder_eof(decoder) == 1); | |||
| // string length | |||
| assert(text_decoder_decode_string(decoder, "aG", -1, ESPEAKNG_ENCODING_ISO_8859_1) == ENS_OK); | |||
| assert(text_decoder_eof(decoder) == 0); | |||
| assert(text_decoder_getc(decoder) == 'a'); | |||
| assert(text_decoder_eof(decoder) == 0); | |||
| assert(text_decoder_getc(decoder) == 'G'); | |||
| assert(text_decoder_eof(decoder) == 0); | |||
| assert(text_decoder_getc(decoder) == 0); | |||
| assert(text_decoder_eof(decoder) == 1); | |||
| destroy_text_decoder(decoder); | |||
| } | |||
| @@ -752,11 +762,12 @@ test_wchar_decoder() | |||
| espeak_ng_TEXT_DECODER *decoder = create_text_decoder(); | |||
| // null string | |||
| assert(text_decoder_decode_wstring(decoder, NULL, 5) == ENS_OK); | |||
| assert(text_decoder_decode_wstring(decoder, NULL, -1) == ENS_OK); | |||
| assert(text_decoder_eof(decoder) == 1); | |||
| assert(text_decoder_getc(decoder) == 0); | |||
| assert(text_decoder_eof(decoder) == 1); | |||
| // wide-character string | |||
| assert(text_decoder_decode_wstring(decoder, L"aG\xA0\x2045", 4) == ENS_OK); | |||
| assert(text_decoder_eof(decoder) == 0); | |||
| assert(text_decoder_getc(decoder) == 'a'); | |||
| @@ -768,6 +779,20 @@ test_wchar_decoder() | |||
| assert(text_decoder_getc(decoder) == 0x2045); | |||
| assert(text_decoder_eof(decoder) == 1); | |||
| // string length | |||
| assert(text_decoder_decode_wstring(decoder, L"aG\xA0\x2045", -1) == ENS_OK); | |||
| assert(text_decoder_eof(decoder) == 0); | |||
| assert(text_decoder_getc(decoder) == 'a'); | |||
| assert(text_decoder_eof(decoder) == 0); | |||
| assert(text_decoder_getc(decoder) == 'G'); | |||
| assert(text_decoder_eof(decoder) == 0); | |||
| assert(text_decoder_getc(decoder) == 0xA0); | |||
| assert(text_decoder_eof(decoder) == 0); | |||
| assert(text_decoder_getc(decoder) == 0x2045); | |||
| assert(text_decoder_eof(decoder) == 0); | |||
| assert(text_decoder_getc(decoder) == 0); | |||
| assert(text_decoder_eof(decoder) == 1); | |||
| destroy_text_decoder(decoder); | |||
| } | |||
| @@ -779,7 +804,7 @@ test_auto_decoder() | |||
| espeak_ng_TEXT_DECODER *decoder = create_text_decoder(); | |||
| // null string | |||
| assert(text_decoder_decode_string_auto(decoder, NULL, 5, ESPEAKNG_ENCODING_ISO_8859_1) == ENS_OK); | |||
| assert(text_decoder_decode_string_auto(decoder, NULL, -1, ESPEAKNG_ENCODING_ISO_8859_1) == ENS_OK); | |||
| assert(text_decoder_eof(decoder) == 1); | |||
| assert(text_decoder_getc(decoder) == 0); | |||
| assert(text_decoder_eof(decoder) == 1); | |||
| @@ -808,6 +833,16 @@ test_auto_decoder() | |||
| assert(text_decoder_getc(decoder) == 'f'); | |||
| assert(text_decoder_eof(decoder) == 1); | |||
| // string length | |||
| assert(text_decoder_decode_string_auto(decoder, "aG", -1, ESPEAKNG_ENCODING_ISO_8859_1) == ENS_OK); | |||
| assert(text_decoder_eof(decoder) == 0); | |||
| assert(text_decoder_getc(decoder) == 'a'); | |||
| assert(text_decoder_eof(decoder) == 0); | |||
| assert(text_decoder_getc(decoder) == 'G'); | |||
| assert(text_decoder_eof(decoder) == 0); | |||
| assert(text_decoder_getc(decoder) == 0); | |||
| assert(text_decoder_eof(decoder) == 1); | |||
| destroy_text_decoder(decoder); | |||
| } | |||