8f2aaaf79d
git-svn-id: svn://svn.rockbox.org/rockbox/trunk@20559 a1c6a512-1295-4272-9138-f99709370657
618 lines
16 KiB
C++
618 lines
16 KiB
C++
/***************************************************************************
|
|
* __________ __ ___.
|
|
* Open \______ \ ____ ____ | | _\_ |__ _______ ___
|
|
* Source | _// _ \_/ ___\| |/ /| __ \ / _ \ \/ /
|
|
* Jukebox | | ( <_> ) \___| < | \_\ ( <_> > < <
|
|
* Firmware |____|_ /\____/ \___ >__|_ \|___ /\____/__/\_ \
|
|
* \/ \/ \/ \/ \/
|
|
*
|
|
* Copyright (C) 2007 by Dominik Wenger
|
|
* $Id$
|
|
*
|
|
* All files in this archive are subject to the GNU General Public License.
|
|
* See the file COPYING in the source tree root for full license agreement.
|
|
*
|
|
* This software is distributed on an "AS IS" basis, WITHOUT WARRANTY OF ANY
|
|
* KIND, either express or implied.
|
|
*
|
|
****************************************************************************/
|
|
|
|
#include "tts.h"
|
|
|
|
|
|
// static variables
|
|
// internal engine name -> human readable engine name, filled by initTTSList()
QMap<QString, QString> TTSBase::ttsList;
// internal engine name -> engine object already handed out by getTTS()
QMap<QString, TTSBase*> TTSBase::ttsCache;
|
|
|
|
// static functions
|
|
void TTSBase::initTTSList()
|
|
{
|
|
ttsList["espeak"] = "Espeak TTS Engine";
|
|
ttsList["flite"] = "Flite TTS Engine";
|
|
ttsList["swift"] = "Swift TTS Engine";
|
|
#if defined(Q_OS_WIN)
|
|
ttsList["sapi"] = "Sapi TTS Engine";
|
|
#endif
|
|
#if defined(Q_OS_LINUX)
|
|
ttsList["festival"] = "Festival TTS Engine";
|
|
#endif
|
|
}
|
|
|
|
// function to get a specific TTS engine (created on first use, then cached)
|
|
// Return the engine object for the internal name ttsName.
// The object is created on the first request and stored in ttsCache, so
// later requests for the same name return the same object. Nothing in this
// function ever deletes a cached object.
TTSBase* TTSBase::getTTS(QString ttsName)
{
    // hand out the already existing object, if there is one
    QMap<QString,TTSBase*>::const_iterator cached = ttsCache.constFind(ttsName);
    if(cached != ttsCache.constEnd())
        return cached.value();

    TTSBase* engine = NULL;
#if defined(Q_OS_WIN)
    if(ttsName == "sapi")
        engine = new TTSSapi();
#endif
#if defined(Q_OS_LINUX)
    if(ttsName == "festival")
        engine = new TTSFestival();
#endif
    // every other name (on every OS) is handled by the generic exe wrapper
    if(engine == NULL)
        engine = new TTSExes(ttsName);

    ttsCache[ttsName] = engine;
    return engine;
}
|
|
|
|
// get the list of TTS engines (internal names, not the nice names)
|
|
// Return the internal names (the keys of ttsList) of all known engines.
QStringList TTSBase::getTTSList()
{
    // the list is filled lazily on first use
    if(ttsList.isEmpty())
    {
        initTTSList();
    }

    return ttsList.keys();
}
|
|
|
|
// get nice name of a specific tts
|
|
// Return the nice name stored in ttsList for the internal engine name tts.
// For a name that is not in the list QMap::value() yields a
// default-constructed QString.
QString TTSBase::getTTSName(QString tts)
{
    // the list is filled lazily on first use
    if(ttsList.count() == 0)
    {
        initTTSList();
    }

    const QString niceName = ttsList.value(tts);
    return niceName;
}
|
|
|
|
/*********************************************************************
|
|
* TTS Base
|
|
**********************************************************************/
|
|
// Base class constructor, only forwards to QObject.
TTSBase::TTSBase()
    : QObject()
{
    // nothing to set up here
}
|
|
|
|
/*********************************************************************
|
|
* General TTS Exes
|
|
**********************************************************************/
|
|
// Generic wrapper around a command line TTS program.
// name is the internal engine name; it selects the command line template
// and is also the key used for all settings lookups of this engine.
TTSExes::TTSExes(QString name) : TTSBase()
{
    m_name = name;

    // command line templates, the %placeholders are substituted in voice()
    m_TemplateMap.insert("espeak", "\"%exe\" %options -w \"%wavfile\" \"%text\"");
    m_TemplateMap.insert("flite", "\"%exe\" %options -o \"%wavfile\" -t \"%text\"");
    m_TemplateMap.insert("swift", "\"%exe\" %options -o \"%wavfile\" \"%text\"");
}
|
|
|
|
// Store the settings object and, if the configured executable does not
// exist, search the directories in PATH for an executable named like the
// engine. The result of the search (an empty string when nothing was
// found) is written to the settings and synced.
void TTSExes::setCfg(RbSettings* sett)
{
    // call function of base class
    TTSBase::setCfg(sett);

    // nothing to do as long as the configured path is fine
    if(configOk())
        return;

    // PATH is ';' separated on Windows and ':' separated everywhere else.
    // Using #else here (instead of naming each Unix flavour) keeps the
    // function compiling on platforms that were not listed explicitly.
#if defined(Q_OS_WIN)
    const QString separator = ";";
#else
    const QString separator = ":";
#endif
    QStringList path = QString(getenv("PATH")).split(separator, QString::SkipEmptyParts);
    qDebug() << path;

    QString exepath;
    for(int i = 0; i < path.size(); i++)
    {
        QString executable = QDir::fromNativeSeparators(path.at(i)) + "/" + m_name;
#if defined(Q_OS_WIN)
        executable += ".exe";
        // PATH entries may be quoted on Windows, drop all quotes
        QStringList ex = executable.split("\"", QString::SkipEmptyParts);
        executable = ex.join("");
#endif
        qDebug() << executable;
        if(QFileInfo(executable).isExecutable())
        {
            // first hit wins
            exepath = QDir::toNativeSeparators(executable);
            break;
        }
    }
    settings->setTTSPath(m_name,exepath);
    settings->sync();
}
|
|
|
|
// Load executable path, options and command line template for this engine.
// Returns true if the configured executable exists. Otherwise *errStr is
// set to a translated message and false is returned.
bool TTSExes::start(QString *errStr)
{
    m_TTSexec = settings->ttsPath(m_name);
    m_TTSOpts = settings->ttsOptions(m_name);
    m_TTSTemplate = m_TemplateMap.value(m_name);

    if(!QFileInfo(m_TTSexec).exists())
    {
        *errStr = tr("TTS executable not found");
        return false;
    }
    return true;
}
|
|
|
|
// Voice text into wavfile by running the configured executable.
// The placeholders of the command line template are substituted in the
// order %exe, %options, %wavfile, %text. The exit status of the program is
// not looked at and errStr is not used: the result is always NoError.
TTSStatus TTSExes::voice(QString text,QString wavfile, QString *errStr)
{
    (void) errStr;

    QString command = m_TTSTemplate;
    command.replace("%exe", m_TTSexec)
           .replace("%options", m_TTSOpts)
           .replace("%wavfile", wavfile)
           .replace("%text", text);
    //qDebug() << "voicing" << command;

    // blocks until the program has finished
    QProcess::execute(command);
    return NoError;
}
|
|
|
|
void TTSExes::showCfg()
|
|
{
|
|
#ifndef CONSOLE
|
|
TTSExesGui gui;
|
|
#else
|
|
TTSExesGuiCli gui;
|
|
#endif
|
|
gui.setCfg(settings);
|
|
gui.showCfg(m_name);
|
|
}
|
|
|
|
bool TTSExes::configOk()
|
|
{
|
|
QString path = settings->ttsPath(m_name);
|
|
|
|
if (QFileInfo(path).exists())
|
|
return true;
|
|
|
|
return false;
|
|
}
|
|
|
|
/*********************************************************************
|
|
* TTS Sapi
|
|
**********************************************************************/
|
|
// Set up the cscript command line template and the defaults.
// The process and stream pointers are created in start(); they are set to
// NULL here so that they never hold an indeterminate value.
TTSSapi::TTSSapi() : TTSBase()
{
    m_TTSTemplate = "cscript //nologo \"%exe\" /language:%lang /voice:\"%voice\" /speed:%speed \"%options\"";
    defaultLanguage ="english";
    m_sapi4 =false;
    voicescript = NULL;
    voicestream = NULL;
}
|
|
|
|
|
|
// Start the Sapi voice script.
// Reads the sapi settings, copies the built-in script to the temp
// directory, launches it through cscript and attaches a UTF-16 text stream
// to the process. Returns true on success; on failure *errStr holds a
// message, false is returned and the process object is released again.
bool TTSSapi::start(QString *errStr)
{
    m_TTSOpts = settings->ttsOptions("sapi");
    m_TTSLanguage = settings->ttsLang("sapi");
    m_TTSVoice = settings->ttsVoice("sapi");
    m_TTSSpeed = QString("%1").arg(settings->ttsSpeed("sapi"));
    m_sapi4 = settings->ttsUseSapi4();

    // always work with a fresh copy of the script
    const QString scriptPath = QDir::tempPath() + "/sapi_voice.vbs";
    QFile::remove(scriptPath);
    QFile::copy(":/builtin/sapi_voice.vbs", scriptPath);
    m_TTSexec = scriptPath;

    QFileInfo tts(m_TTSexec);
    if(!tts.exists())
    {
        *errStr = tr("Could not copy the Sapi-script");
        return false;
    }

    // create the voice process
    QString execstring = m_TTSTemplate;
    execstring.replace("%exe",m_TTSexec);
    execstring.replace("%options",m_TTSOpts);
    execstring.replace("%lang",m_TTSLanguage);
    execstring.replace("%voice",m_TTSVoice);
    execstring.replace("%speed",m_TTSSpeed);

    if(m_sapi4)
        execstring.append(" /sapi4 ");

    qDebug() << "init" << execstring;
    voicescript = new QProcess(NULL);
    //connect(voicescript,SIGNAL(readyReadStandardError()),this,SLOT(error()));

    voicescript->start(execstring);
    if(!voicescript->waitForStarted())
    {
        *errStr = tr("Could not start the Sapi-script");
        // do not leak the process object
        delete voicescript;
        voicescript = NULL;
        return false;
    }

    // no output within 300ms: fail only if the script wrote to stderr
    if(!voicescript->waitForReadyRead(300))
    {
        *errStr = voicescript->readAllStandardError();
        if(*errStr != "")
        {
            // deleting the QProcess also ends the still running script
            delete voicescript;
            voicescript = NULL;
            return false;
        }
    }

    voicestream = new QTextStream(voicescript);
    voicestream->setCodec("UTF16-LE");

    return true;
}
|
|
|
|
|
|
// Ask the Sapi script for the voices available for language.
// The script is copied to the temp directory, run with /listvoices and its
// stderr output is split at ','. The entries are sorted, the first one is
// dropped (presumably not a voice name - TODO confirm against the script)
// and the rest is whitespace-simplified. An empty list is returned if the
// script could not be copied or started.
QStringList TTSSapi::getVoiceList(QString language)
{
    QStringList result;

    const QString scriptPath = QDir::tempPath() + "/sapi_voice.vbs";
    QFile::copy(":/builtin/sapi_voice.vbs", scriptPath);
    m_TTSexec = scriptPath;

    QFileInfo tts(m_TTSexec);
    if(!tts.exists())
        return result;

    // create the voice process
    QString execstring = "cscript //nologo \"%exe\" /language:%lang /listvoices";
    execstring.replace("%exe",m_TTSexec);
    execstring.replace("%lang",language);

    if(settings->ttsUseSapi4())
        execstring.append(" /sapi4 ");

    qDebug() << "init" << execstring;

    QString dataRaw;
    {
        // A local process object is used here on purpose: it cannot leak on
        // the early return and it does not overwrite the voicescript member
        // that start() and stop() work with.
        QProcess lister;
        lister.start(execstring);
        qDebug() << "wait for started";
        if(!lister.waitForStarted())
            return result;
        lister.closeWriteChannel();
        lister.waitForReadyRead();

        dataRaw = lister.readAllStandardError().data();
    }   // the process is gone here, before the script file gets removed

    result = dataRaw.split(",",QString::SkipEmptyParts);
    result.sort();
    // removeFirst() must not be called on an empty list
    if(!result.isEmpty())
        result.removeFirst();
    for(int i = 0; i < result.size(); i++)
    {
        result[i] = result.at(i).simplified();
    }

    // make sure the file can be removed, then clean up
    QFile::setPermissions(scriptPath, QFile::ReadOwner | QFile::WriteOwner | QFile::ExeOwner
                                    | QFile::ReadUser | QFile::WriteUser | QFile::ExeUser
                                    | QFile::ReadGroup | QFile::WriteGroup | QFile::ExeGroup
                                    | QFile::ReadOther | QFile::WriteOther | QFile::ExeOther );
    QFile::remove(scriptPath);

    return result;
}
|
|
|
|
|
|
|
|
// Voice text into wavfile using the script started by start().
// A tab separated SPEAK command followed by a SYNC command is written to
// the script, then the function waits until the script has output ready.
// errStr is not used, the result is always NoError.
TTSStatus TTSSapi::voice(QString text,QString wavfile, QString *errStr)
{
    (void) errStr;

    const QString query = QString("SPEAK\t") + wavfile + "\t" + text + "\r\n";
    qDebug() << "voicing" << query;

    *voicestream << query << "SYNC\tbla\r\n";
    voicestream->flush();

    voicescript->waitForReadyRead();
    return NoError;
}
|
|
|
|
bool TTSSapi::stop()
|
|
{
|
|
|
|
*voicestream << "QUIT\r\n";
|
|
voicestream->flush();
|
|
voicescript->waitForFinished();
|
|
delete voicestream;
|
|
delete voicescript;
|
|
QFile::setPermissions(QDir::tempPath() +"/sapi_voice.vbs",QFile::ReadOwner |QFile::WriteOwner|QFile::ExeOwner
|
|
|QFile::ReadUser| QFile::WriteUser| QFile::ExeUser
|
|
|QFile::ReadGroup |QFile::WriteGroup |QFile::ExeGroup
|
|
|QFile::ReadOther |QFile::WriteOther |QFile::ExeOther );
|
|
QFile::remove(QDir::tempPath() +"/sapi_voice.vbs");
|
|
return true;
|
|
}
|
|
|
|
|
|
void TTSSapi::showCfg()
|
|
{
|
|
#ifndef CONSOLE
|
|
TTSSapiGui gui(this);
|
|
#else
|
|
TTSSapiGuiCli gui(this);
|
|
#endif
|
|
gui.setCfg(settings);
|
|
gui.showCfg();
|
|
}
|
|
|
|
bool TTSSapi::configOk()
|
|
{
|
|
if(settings->ttsVoice("sapi").isEmpty())
|
|
return false;
|
|
return true;
|
|
}
|
|
/**********************************************************************
|
|
* TTSFestival - client-server wrapper
|
|
**********************************************************************/
|
|
// Shut the festival server process down together with the object.
TTSFestival::~TTSFestival()
{
    this->stop();
}
|
|
|
|
void TTSFestival::startServer()
|
|
{
|
|
if(!configOk())
|
|
return;
|
|
|
|
QStringList paths = settings->ttsPath("festival").split(":");
|
|
|
|
serverProcess.start(QString("%1 --server").arg(paths[0]));
|
|
serverProcess.waitForStarted();
|
|
|
|
queryServer("(getpid)");
|
|
if(serverProcess.state() == QProcess::Running)
|
|
qDebug() << "Festival is up and running";
|
|
else
|
|
qDebug() << "Festival failed to start";
|
|
}
|
|
|
|
void TTSFestival::ensureServerRunning()
|
|
{
|
|
if(serverProcess.state() != QProcess::Running)
|
|
{
|
|
// least common denominator for all the server startup code paths
|
|
QProgressDialog progressDialog(tr(""), tr(""), 0, 0);
|
|
progressDialog.setWindowTitle(tr("Starting festival"));
|
|
progressDialog.setModal(true);
|
|
progressDialog.setLabel(0);
|
|
progressDialog.setCancelButton(0);
|
|
progressDialog.show();
|
|
|
|
QApplication::processEvents(); // actually show the dialog
|
|
|
|
startServer();
|
|
}
|
|
}
|
|
|
|
// Make sure the server runs and select the configured voice, if any.
// errStr is not used, the result is always true.
bool TTSFestival::start(QString* errStr)
{
    (void) errStr;

    ensureServerRunning();

    const QString voiceName = settings->ttsVoice("festival");
    if (!voiceName.isEmpty())
        queryServer(QString("(voice.select '%1)").arg(voiceName));

    return true;
}
|
|
|
|
bool TTSFestival::stop()
|
|
{
|
|
serverProcess.terminate();
|
|
serverProcess.kill();
|
|
|
|
return true;
|
|
}
|
|
|
|
// Voice text into wavfile with the festival client (second entry of the
// ':' separated festival path setting), which talks to the local server.
// Returns NoError when the client answer contains "Utterance". Otherwise
// *errStr is set (if given) and Warning is returned, so that a single
// string does not stop the whole voicing process.
TTSStatus TTSFestival::voice(QString text, QString wavfile, QString* errStr)
{
    qDebug() << text << "->" << wavfile;

    QStringList paths = settings->ttsPath("festival").split(":");
    // without a client entry there is nothing to run; paths[1] must not be
    // touched in that case
    if(paths.size() < 2)
    {
        qDebug() << "Could not voice string: no festival client configured";
        if(errStr != NULL)
            *errStr = tr("engine could not voice string");
        return Warning;
    }

    QString cmd = QString("%1 --server localhost --otype riff --ttw --withlisp --output \"%2\" - ").arg(paths[1]).arg(wavfile);
    qDebug() << cmd;

    QProcess clientProcess;
    clientProcess.start(cmd);
    // the text is fed to the client on stdin
    clientProcess.write(QString("%1.\n").arg(text).toAscii());
    clientProcess.waitForBytesWritten();
    clientProcess.closeWriteChannel();
    clientProcess.waitForReadyRead();
    QString response = clientProcess.readAll();
    response = response.trimmed();
    if(!response.contains("Utterance"))
    {
        qDebug() << "Could not voice string: " << response;
        if(errStr != NULL)
            *errStr = tr("engine could not voice string");
        return Warning;
        /* do not stop the voicing process because of a single string
        TODO: needs proper settings */
    }
    clientProcess.closeReadChannel(QProcess::StandardError);
    clientProcess.closeReadChannel(QProcess::StandardOutput);
    clientProcess.terminate();
    clientProcess.kill();

    return NoError;
}
|
|
|
|
bool TTSFestival::configOk()
|
|
{
|
|
QStringList paths = settings->ttsPath("festival").split(":");
|
|
if(paths.size() != 2)
|
|
return false;
|
|
bool ret = QFileInfo(paths[0]).isExecutable() &&
|
|
QFileInfo(paths[1]).isExecutable();
|
|
if(settings->ttsVoice("festival").size() > 0 && voices.size() > 0)
|
|
ret = ret && (voices.indexOf(settings->ttsVoice("festival")) != -1);
|
|
return ret;
|
|
}
|
|
|
|
void TTSFestival::showCfg()
|
|
{
|
|
#ifndef CONSOLE
|
|
TTSFestivalGui gui(this);
|
|
#endif
|
|
gui.setCfg(settings);
|
|
gui.showCfg();
|
|
}
|
|
|
|
// Return the sorted list of voices known to the festival server.
// The list is fetched with "(voice.list)" once and kept in voices; later
// calls return that cached list. An empty list is returned when the
// configuration is not ok.
QStringList TTSFestival::getVoiceList()
{
    if(!configOk())
        return QStringList();

    if(!voices.isEmpty())
    {
        qDebug() << "Using voice cache";
        return voices;
    }

    QString reply = queryServer("(voice.list)");

    // get the 2nd line. It should be (<voice_name>, <voice_name>)
    const int firstBreak = reply.indexOf('\n');
    reply = reply.mid(firstBreak + 1, -1);
    const int secondBreak = reply.indexOf('\n');
    reply = reply.left(secondBreak).trimmed();

    // cut off the first and the last character and split at the blanks
    voices = reply.mid(1, reply.size()-2).split(' ');
    voices.sort();

    // splitting an empty string leaves a single empty entry behind
    if (voices.size() == 1 && voices[0].size() == 0)
        voices.removeAt(0);

    if (voices.isEmpty())
        qDebug() << "No voices.";
    else
        qDebug() << "Voices: " << voices;

    return voices;
}
|
|
|
|
// Return a human readable description of voice.
// The description is requested from the server with "(voice.description
// '<voice>)" and reformatted into "Key: Value" lines; results are cached in
// voiceDescriptions. An empty string is returned when the configuration is
// not ok or the voice is not in the voice list.
QString TTSFestival::getVoiceInfo(QString voice)
{
    if(!configOk())
        return "";

    if(!getVoiceList().contains(voice))
        return "";

    if(voiceDescriptions.contains(voice))
        return voiceDescriptions[voice];

    QString response = queryServer(QString("(voice.description '%1)").arg(voice), 3000);

    if (response == "")
    {
        voiceDescriptions[voice]=tr("No description available");
    }
    else
    {
        response = response.remove(QRegExp("(description \"*\")", Qt::CaseInsensitive, QRegExp::Wildcard));
        qDebug() << "voiceInfo w/o descr: " << response;
        response = response.remove(')');
        QStringList responseLines = response.split('(', QString::SkipEmptyParts);
        responseLines.removeAt(0); // the voice name itself

        QString description;
        foreach(QString line, responseLines)
        {
            line = line.remove('(');
            line = line.simplified();

            // a part made of whitespace only is empty by now; there is
            // no first character to capitalize, so skip it
            if(line.isEmpty())
                continue;

            line[0] = line[0].toUpper(); // capitalize the key

            int firstSpace = line.indexOf(' ');
            if (firstSpace > 0)
            {
                line = line.insert(firstSpace, ':'); // add a colon between the key and the value
                line[firstSpace+2] = line[firstSpace+2].toUpper(); // capitalize the value
            }

            description += line + "\n";
        }
        voiceDescriptions[voice] = description.trimmed();
    }
    return voiceDescriptions[voice];
}
|
|
|
|
// Send query to the festival server on localhost:1314 and return the
// answer.
// The query is repeated, with a pause of 500ms in between, until the
// server gives an answer that is neither empty nor "LP". With timeout > 0
// (milliseconds) the function gives up and returns "" once that time has
// passed; otherwise it keeps trying. An answer of "nil" is returned as "".
// From answers of more than two lines the first and the last line are
// removed. "" is returned as well when the configuration is not ok.
QString TTSFestival::queryServer(QString query, int timeout)
{
    if(!configOk())
        return "";

    ensureServerRunning();

    qDebug() << "queryServer with " << query;
    QString response;

    const bool hasDeadline = (timeout > 0);
    QDateTime endTime;
    if(hasDeadline)
        endTime = QDateTime::currentDateTime().addMSecs(timeout);

    /* Festival is *extremely* unreliable. Although at this
     * point we are sure that SIOD is accepting commands,
     * we might end up with an empty response. Hence, the loop.
     */
    for(;;)
    {
        QApplication::processEvents(QEventLoop::AllEvents, 50);

        // a fresh connection for every attempt
        QTcpSocket socket;
        socket.connectToHost("localhost", 1314);
        socket.waitForConnected();

        if(socket.state() == QAbstractSocket::ConnectedState)
        {
            socket.write(QString("%1\n").arg(query).toAscii());
            socket.waitForBytesWritten();
            socket.waitForReadyRead();

            response = socket.readAll().trimmed();

            const bool unusable = (response == "LP" || response == "");
            if (!unusable)
                break;
        }
        socket.abort();
        socket.disconnectFromHost();

        if(hasDeadline && QDateTime::currentDateTime() >= endTime)
            return "";

        /* make sure we wait a little as we don't want to flood the server with requests */
        const QDateTime pauseEnd = QDateTime::currentDateTime().addMSecs(500);
        while(QDateTime::currentDateTime() < pauseEnd)
            QApplication::processEvents(QEventLoop::AllEvents);
    }

    if(response == "nil")
        return "";

    QStringList lines = response.split('\n');
    if(lines.size() <= 2)
    {
        qDebug() << "Response too short: " << response;
    }
    else
    {
        // strip the first and the last line of the answer
        lines.removeFirst();
        lines.removeLast();
    }
    return lines.join("\n");
}
|
|
|