scummvm/backends/text-to-speech/linux/linux-text-to-speech.cpp

280 lines
8.6 KiB
C++
Raw Normal View History

2019-07-10 10:49:29 +02:00
/* ScummVM - Graphic Adventure Engine
*
* ScummVM is the legal property of its developers, whose names
* are too numerous to list here. Please refer to the COPYRIGHT
* file distributed with this source distribution.
*
* This program is free software; you can redistribute it and/or
* modify it under the terms of the GNU General Public License
* as published by the Free Software Foundation; either version 2
* of the License, or (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program; if not, write to the Free Software
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
*
*/
// Disable symbol overrides so that we can use system headers.
#define FORBIDDEN_SYMBOL_ALLOW_ALL
#include "backends/text-to-speech/linux/linux-text-to-speech.h"
#if defined(USE_LINUX_TTS)
2019-07-11 00:14:28 +02:00
#include <speech-dispatcher/libspeechd.h>
#include "backends/platform/sdl/sdl-sys.h"
//#include <iconv.h>
2019-07-11 00:14:28 +02:00
2019-07-10 10:49:29 +02:00
#include "common/translation.h"
2019-07-11 00:14:28 +02:00
#include "common/system.h"
#include "common/ustr.h"
#include "common/config-manager.h"
2019-07-11 00:14:28 +02:00
SPDConnection *_connection;
void speech_begin_callback(size_t msg_id, size_t client_id, SPDNotificationType state){
LinuxTextToSpeechManager *manager =
static_cast<LinuxTextToSpeechManager *> (g_system->getTextToSpeechManager());
manager->updateState(LinuxTextToSpeechManager::SPEAKING);
}
void speech_end_callback(size_t msg_id, size_t client_id, SPDNotificationType state){
LinuxTextToSpeechManager *manager =
static_cast<LinuxTextToSpeechManager *> (g_system->getTextToSpeechManager());
manager->updateState(LinuxTextToSpeechManager::READY);
}
void speech_cancel_callback(size_t msg_id, size_t client_id, SPDNotificationType state){
LinuxTextToSpeechManager *manager =
static_cast<LinuxTextToSpeechManager *> (g_system->getTextToSpeechManager());
manager->updateState(LinuxTextToSpeechManager::READY);
}
void speech_resume_callback(size_t msg_id, size_t client_id, SPDNotificationType state){
LinuxTextToSpeechManager *manager =
static_cast<LinuxTextToSpeechManager *> (g_system->getTextToSpeechManager());
manager->updateState(LinuxTextToSpeechManager::SPEAKING);
}
void speech_pause_callback(size_t msg_id, size_t client_id, SPDNotificationType state){
LinuxTextToSpeechManager *manager =
static_cast<LinuxTextToSpeechManager *> (g_system->getTextToSpeechManager());
manager->updateState(LinuxTextToSpeechManager::PAUSED);
}
LinuxTextToSpeechManager::LinuxTextToSpeechManager()
: _speechState(READY) {
init();
}
void LinuxTextToSpeechManager::init() {
2019-07-11 00:14:28 +02:00
_connection = spd_open("ScummVM", "main", NULL, SPD_MODE_THREADED);
if (_connection == 0) {
_speechState = BROKEN;
warning("Couldn't initialize text to speech through speech-dispatcher");
2019-07-11 00:14:28 +02:00
return;
}
2019-07-10 10:49:29 +02:00
2019-07-11 00:14:28 +02:00
_connection->callback_begin = speech_begin_callback;
spd_set_notification_on(_connection, SPD_BEGIN);
_connection->callback_end = speech_end_callback;
spd_set_notification_on(_connection, SPD_END);
_connection->callback_cancel = speech_cancel_callback;
spd_set_notification_on(_connection, SPD_CANCEL);
_connection->callback_resume = speech_resume_callback;
spd_set_notification_on(_connection, SPD_RESUME);
_connection->callback_pause = speech_pause_callback;
spd_set_notification_on(_connection, SPD_PAUSE);
updateVoices();
_ttsState->_activeVoice = 0;
#ifdef USE_TRANSLATION
setLanguage(TransMan.getCurrentLanguage());
#else
setLanguage("en");
#endif
2019-07-10 10:49:29 +02:00
}
LinuxTextToSpeechManager::~LinuxTextToSpeechManager() {
if (_connection != 0)
spd_close(_connection);
2019-07-11 00:14:28 +02:00
}
void LinuxTextToSpeechManager::updateState(LinuxTextToSpeechManager::SpeechState state) {
_speechState = state;
}
Common::String LinuxTextToSpeechManager::strToUtf8(Common::String str, Common::String charset) {
#if SDL_VERSION_ATLEAST(2, 0, 0)
char *conv_text = SDL_iconv_string("UTF-8", charset.c_str(), str.c_str(), str.size() + 1);
Common::String result;
if (conv_text) {
result = conv_text;
SDL_free(conv_text);
} else if (charset != "ASCII"){
warning("Could not convert text from %s to UTF-8, trying ASCII", charset.c_str());
return strToUtf8(str, "ASCII");
} else
warning("Could not convert text to UTF-8");
return result;
#else
return Common::String();
#endif
}
bool LinuxTextToSpeechManager::say(Common::String str, Action action, Common::String charset) {
if (_speechState == BROKEN)
return true;
if (action == DROP && isSpeaking())
return true;
if (charset.empty()) {
#ifdef USE_TRANSLATION
charset = TransMan.getCurrentCharset();
#else
charset = "ASCII";
#endif
}
str = strToUtf8(str, charset);
if (isSpeaking() && action == INTERRUPT)
2019-07-11 00:14:28 +02:00
stop();
if (str.size() != 0)
_speechState = SPEAKING;
if(spd_say(_connection, SPD_MESSAGE, str.c_str()) == -1) {
//restart the connection
if (_connection != 0)
spd_close(_connection);
init();
return true;
}
return false;
2019-07-11 00:14:28 +02:00
}
bool LinuxTextToSpeechManager::stop() {
if (_speechState == READY || _speechState == BROKEN)
return true;
_speechState = READY;
2019-07-11 00:14:28 +02:00
return spd_cancel(_connection) == -1;
}
bool LinuxTextToSpeechManager::pause() {
if (_speechState == READY || _speechState == PAUSED || _speechState == BROKEN)
return true;
_speechState = PAUSED;
2019-07-11 00:14:28 +02:00
return spd_pause(_connection) == -1;
}
bool LinuxTextToSpeechManager::resume() {
if (_speechState == READY || _speechState == SPEAKING || _speechState == BROKEN)
return true;
_speechState = SPEAKING;
2019-07-11 00:14:28 +02:00
return spd_resume(_connection) == -1;
}
bool LinuxTextToSpeechManager::isSpeaking() {
return _speechState == SPEAKING;
}
bool LinuxTextToSpeechManager::isPaused() {
return _speechState == PAUSED;
}
bool LinuxTextToSpeechManager::isReady() {
return _speechState == READY;
2019-07-11 00:14:28 +02:00
}
void LinuxTextToSpeechManager::setVoice(unsigned index) {
if (_speechState == BROKEN)
return;
assert(index < _ttsState->_availableVoices.size());
Common::TTSVoice voice = _ttsState->_availableVoices[index];
spd_set_voice_type(_connection, *(SPDVoiceType *)(voice.getData()));
_ttsState->_activeVoice = index;
2019-07-11 00:14:28 +02:00
}
void LinuxTextToSpeechManager::setRate(int rate) {
if (_speechState == BROKEN)
return;
2019-07-11 00:14:28 +02:00
assert(rate >= -100 && rate <= 100);
spd_set_voice_rate(_connection, rate);
_ttsState->_rate = rate;
}
void LinuxTextToSpeechManager::setPitch(int pitch) {
if (_speechState == BROKEN)
return;
2019-07-11 00:14:28 +02:00
assert(pitch >= -100 && pitch <= 100);
spd_set_voice_pitch(_connection, pitch);
_ttsState->_pitch = pitch;
}
2019-07-12 12:52:18 +02:00
void LinuxTextToSpeechManager::setVolume(unsigned volume) {
if (_speechState == BROKEN)
return;
2019-07-12 12:52:18 +02:00
assert(volume <= 100);
spd_set_volume(_connection, (volume - 50) * 2);
2019-07-11 00:14:28 +02:00
_ttsState->_volume = volume;
}
void LinuxTextToSpeechManager::setLanguage(Common::String language) {
if (_speechState == BROKEN)
return;
2019-07-11 00:14:28 +02:00
spd_set_language(_connection, language.c_str());
_ttsState->_language = language;
setVoice(_ttsState->_activeVoice);
2019-07-11 00:14:28 +02:00
}
2019-07-17 13:33:42 +02:00
void LinuxTextToSpeechManager::createVoice(int typeNumber, Common::TTSVoice::Gender gender, Common::TTSVoice::Age age, char *description) {
2019-07-12 22:16:44 +02:00
SPDVoiceType *type = (SPDVoiceType *) malloc(sizeof(SPDVoiceType));
*type = static_cast<SPDVoiceType>(typeNumber);
Common::TTSVoice voice(gender, age, (void *) type, description);
_ttsState->_availableVoices.push_back(voice);
2019-07-12 22:16:44 +02:00
}
2019-07-11 00:14:28 +02:00
void LinuxTextToSpeechManager::updateVoices() {
if (_speechState == BROKEN)
return;
2019-07-11 00:14:28 +02:00
/* just use these voices:
SPD_MALE1, SPD_MALE2, SPD_MALE3,
SPD_FEMALE1, SPD_FEMALE2, SPD_FEMALE3,
SPD_CHILD_MALE, SPD_CHILD_FEMALE
it depends on the user to map them to the right voices in speech-dispatcher
configuration
*/
_ttsState->_availableVoices.clear();
2019-07-11 00:14:28 +02:00
2019-07-12 22:16:44 +02:00
char **voiceInfo = spd_list_voices(_connection);
2019-07-11 00:14:28 +02:00
2019-07-17 13:33:42 +02:00
createVoice(SPD_MALE1, Common::TTSVoice::MALE, Common::TTSVoice::ADULT, voiceInfo[0]);
createVoice(SPD_MALE2, Common::TTSVoice::MALE, Common::TTSVoice::ADULT, voiceInfo[1]);
createVoice(SPD_MALE3, Common::TTSVoice::MALE, Common::TTSVoice::ADULT, voiceInfo[2]);
createVoice(SPD_FEMALE1, Common::TTSVoice::FEMALE, Common::TTSVoice::ADULT, voiceInfo[3]);
createVoice(SPD_FEMALE2, Common::TTSVoice::FEMALE, Common::TTSVoice::ADULT, voiceInfo[4]);
createVoice(SPD_FEMALE3, Common::TTSVoice::FEMALE, Common::TTSVoice::ADULT, voiceInfo[5]);
createVoice(SPD_CHILD_MALE, Common::TTSVoice::MALE, Common::TTSVoice::CHILD, voiceInfo[6]);
createVoice(SPD_CHILD_FEMALE, Common::TTSVoice::FEMALE, Common::TTSVoice::CHILD, voiceInfo[7]);
2019-07-11 00:14:28 +02:00
for (int i = 0; i < 8; i++)
free(voiceInfo[i]);
free(voiceInfo);
2019-07-10 10:49:29 +02:00
}
void LinuxTextToSpeechManager::freeVoiceData(void *data) {
free(data);
}
2019-07-10 10:49:29 +02:00
#endif