LunaTranslator/cpp/implsapi.cpp

115 lines
4.4 KiB
C++
Raw Normal View History

2024-05-17 22:53:40 +08:00
2024-12-29 19:32:24 +08:00
wchar_t SPCAT_VOICES_7[] = LR"(HKEY_LOCAL_MACHINE\SOFTWARE\Microsoft\Speech\Voices)";
wchar_t SPCAT_VOICES_10[] = LR"(HKEY_LOCAL_MACHINE\SOFTWARE\Microsoft\Speech_OneCore\Voices)";
2024-07-14 15:09:37 +08:00
std::optional<std::vector<byte>> _Speak(std::wstring &Content, const wchar_t *token, int voiceid, int rate, int volume)
2024-05-17 22:53:40 +08:00
{
2024-07-14 15:09:37 +08:00
std::optional<std::vector<byte>> ret = {};
2024-12-29 18:09:35 +08:00
[&]()
2024-05-17 22:53:40 +08:00
{
2024-12-29 18:09:35 +08:00
CO_INIT co;
CHECK_FAILURE_NORET(co);
CComPtr<ISpVoice> pVoice = NULL;
CHECK_FAILURE_NORET(pVoice.CoCreateInstance(CLSID_SpVoice, NULL, CLSCTX_ALL));
2024-12-29 15:35:27 +08:00
CComPtr<IEnumSpObjectTokens> pSpEnumTokens = NULL;
2024-12-29 18:09:35 +08:00
CHECK_FAILURE_NORET(SpEnumTokens(token, NULL, NULL, &pSpEnumTokens));
ULONG ulTokensNumber = 0;
pSpEnumTokens->GetCount(&ulTokensNumber);
ISpObjectToken *m_pISpObjectToken;
2024-05-17 22:53:40 +08:00
2024-12-29 18:09:35 +08:00
pSpEnumTokens->Item(voiceid, &m_pISpObjectToken);
pVoice->SetVoice(m_pISpObjectToken);
pVoice->SetRate(rate);
pVoice->SetVolume(volume);
2024-05-17 22:53:40 +08:00
2024-12-29 18:09:35 +08:00
CComPtr<ISpStream> cpWavStream;
CComPtr<ISpStreamFormat> cpOldStream;
CSpStreamFormat originalFmt;
CComPtr<IStream> pMemStream;
CHECK_FAILURE_NORET(pVoice->GetOutputStream(&cpOldStream));
originalFmt.AssignFormat(cpOldStream);
CHECK_FAILURE_NORET(CreateStreamOnHGlobal(NULL, TRUE, &pMemStream));
CHECK_FAILURE_NORET(cpWavStream.CoCreateInstance(CLSID_SpStream));
CHECK_FAILURE_NORET(cpWavStream->SetBaseStream(pMemStream, SPDFID_WaveFormatEx, originalFmt.WaveFormatExPtr()));
pVoice->SetOutput(cpWavStream, TRUE);
pVoice->Speak(Content.c_str(), SPF_IS_XML, NULL);
2024-05-17 22:53:40 +08:00
2024-12-29 18:09:35 +08:00
/*To verify that the data has been written correctly, uncomment this, you should hear the voice.
cpVoice->SetOutput(NULL, FALSE);
cpVoice->SpeakStream(cpStream, SPF_DEFAULT, NULL);
*/
2024-05-17 22:53:40 +08:00
2024-12-29 18:09:35 +08:00
// After SAPI writes the stream, the stream position is at the end, so we need to set it to the beginning.
_LARGE_INTEGER a = {0};
CHECK_FAILURE_NORET(cpWavStream->Seek(a, STREAM_SEEK_SET, NULL));
2024-05-17 22:53:40 +08:00
2024-12-29 18:09:35 +08:00
// get the base istream from the ispstream
CComPtr<IStream> pIstream;
cpWavStream->GetBaseStream(&pIstream);
2024-05-17 22:53:40 +08:00
2024-12-29 18:09:35 +08:00
// calculate the size that is to be read
STATSTG stats;
pIstream->Stat(&stats, STATFLAG_NONAME);
2024-05-17 22:53:40 +08:00
2024-12-29 18:09:35 +08:00
ULONG sSize = stats.cbSize.QuadPart; // size of the data to be read
2024-05-17 22:53:40 +08:00
2024-12-29 18:09:35 +08:00
ULONG bytesRead; // this will tell the number of bytes that have been read
std::vector<byte> datas;
2025-01-02 22:56:39 +08:00
datas.resize(sSize + 46);
2024-12-29 18:09:35 +08:00
auto pBuffer = datas.data(); // buffer to read the data
// memcpy(pBuffer,&wavHeader,sizeof(WAV_HEADER));
2025-01-02 22:56:39 +08:00
int fsize = sSize + 46;
2024-12-29 18:09:35 +08:00
int ptr = 0;
memcpy(pBuffer, "RIFF", 4);
ptr += 4;
memcpy(pBuffer + ptr, &fsize, 4);
ptr += 4;
memcpy(pBuffer + ptr, "WAVEfmt ", 8);
ptr += 8;
memcpy(pBuffer + ptr, "\x12\x00\x00\x00", 4);
ptr += 4;
memcpy(pBuffer + ptr, originalFmt.WaveFormatExPtr(), sizeof(WAVEFORMATEX));
ptr += sizeof(WAVEFORMATEX);
memcpy(pBuffer + ptr, "data", 4);
ptr += 4;
memcpy(pBuffer + ptr, &sSize, 4);
ptr += 4;
// read the data into the buffer
pIstream->Read(pBuffer + ptr, sSize, &bytesRead);
2024-05-17 22:53:40 +08:00
2024-12-29 18:09:35 +08:00
ret = std::move(datas);
}();
2024-05-17 22:53:40 +08:00
return ret;
}
std::vector<std::wstring> _List(const wchar_t *token)
{
std::vector<std::wstring> ret;
2024-12-29 18:09:35 +08:00
[&]()
2024-05-17 22:53:40 +08:00
{
2024-12-29 18:09:35 +08:00
CO_INIT co;
CHECK_FAILURE_NORET(co);
CComPtr<ISpVoice> pSpVoice = NULL;
CComPtr<IEnumSpObjectTokens> pSpEnumTokens = NULL;
CHECK_FAILURE_NORET(CoCreateInstance(CLSID_SpVoice, NULL, CLSCTX_ALL, IID_ISpVoice, (void **)&pSpVoice));
CHECK_FAILURE_NORET(SpEnumTokens(token, NULL, NULL, &pSpEnumTokens));
2024-05-17 22:53:40 +08:00
ULONG ulTokensNumber = 0;
pSpEnumTokens->GetCount(&ulTokensNumber);
2024-12-29 15:35:27 +08:00
CComPtr<ISpObjectToken> m_pISpObjectToken;
2024-05-17 22:53:40 +08:00
for (ULONG i = 0; i < ulTokensNumber; i++)
{
pSpEnumTokens->Item(i, &m_pISpObjectToken);
2024-12-29 18:09:35 +08:00
CComHeapPtr<WCHAR> pszVoiceId;
CComHeapPtr<WCHAR> pszVoiceName;
2024-05-17 22:53:40 +08:00
if (SUCCEEDED(m_pISpObjectToken->GetId(&pszVoiceId)))
{
if (SUCCEEDED(m_pISpObjectToken->GetStringValue(NULL, &pszVoiceName)))
{
ret.emplace_back(pszVoiceName);
}
}
}
2024-12-29 18:09:35 +08:00
}();
2024-05-17 22:53:40 +08:00
return ret;
}