// Textractor_test/GUI/host/textthread.cc
// (66 lines, 1.7 KiB, C++)

// textthread.cc
// 8/24/2013 jichi
// Branch IHF/TextThread.cpp, rev 133
#include "textthread.h"
2018-09-21 10:32:47 +08:00
#include "host.h"
2018-08-23 23:53:23 +08:00
#include "const.h"
2018-10-09 13:46:11 +08:00
#include <regex>
#include <algorithm>
2018-11-02 03:03:30 +08:00
// Creates a text thread from the given thread parameters, hook parameters and name.
// handle takes the current value of threadCounter, which is then incremented.
TextThread::TextThread(ThreadParam tp, HookParam hp, std::wstring name) :
	handle(threadCounter++),
	name(name),
	tp(tp),
	hp(hp)
{
}
2018-07-19 04:18:43 +08:00
// Shuts the text thread down: signals deletionEvent, waits for flushThread to
// finish, and finally closes the event handle.
TextThread::~TextThread()
{
	// Order matters: the event is signalled before the join and its handle is
	// closed only after the join has returned.
	// NOTE(review): flushThread presumably watches deletionEvent to know when to
	// exit - confirm where flushThread is started.
	SetEvent(deletionEvent);
	flushThread.join();
	CloseHandle(deletionEvent);
}
2018-10-08 12:26:43 +08:00
std::wstring TextThread::GetStorage()
2018-07-26 12:48:18 +08:00
{
2018-10-31 08:50:50 +08:00
LOCK(threadMutex);
2018-07-26 12:48:18 +08:00
return storage;
}
2018-08-26 04:02:16 +08:00
void TextThread::Flush()
{
std::wstring sentence;
2018-05-25 16:34:40 +08:00
{
2018-10-31 08:50:50 +08:00
LOCK(threadMutex);
if (buffer.empty()) return;
2018-10-09 14:09:52 +08:00
if (buffer.size() < maxBufferSize && GetTickCount() - timestamp < flushDelay) return;
sentence = buffer;
2018-08-29 05:21:20 +08:00
buffer.clear();
bool hasRepetition = false;
for (std::wsmatch results; std::regex_search(sentence, results, std::wregex(L"([^\\x00]{6,})\\1\\1")); hasRepetition = true) sentence = results[1];
if (hasRepetition) repeatingChars = std::unordered_set<wchar_t>(sentence.begin(), sentence.end());
else repeatingChars.clear();
2018-08-03 13:48:57 +08:00
}
2018-07-21 05:21:35 +08:00
AddSentence(sentence);
}
2018-05-25 16:34:40 +08:00
void TextThread::AddSentence(std::wstring sentence)
{
2018-08-29 05:21:20 +08:00
// Dispatch to extensions occurs here. Don't hold mutex! Extensions might take a while!
2018-10-08 12:26:43 +08:00
if (Output(this, sentence))
{
2018-10-31 08:50:50 +08:00
LOCK(threadMutex);
2018-10-08 12:26:43 +08:00
storage += sentence;
}
}
2018-09-02 01:56:45 +08:00
void TextThread::AddText(const BYTE* data, int len)
{
2018-10-31 08:50:50 +08:00
if (len < 0) return;
LOCK(threadMutex);
buffer += hp.type & USING_UNICODE
? std::wstring((wchar_t*)data, len / 2)
2018-11-02 09:59:13 +08:00
: StringToWideString(std::string((char*)data, len), hp.codepage != 0 ? hp.codepage : DEFAULT_CODEPAGE);
if (std::all_of(buffer.begin(), buffer.end(), [&](wchar_t c) { return repeatingChars.count(c) > 0; })) buffer.clear();
timestamp = GetTickCount();
}
// EOF