mirror of
https://github.com/Artikash/Textractor.git
synced 2024-12-24 01:14:12 +08:00
66 lines
1.7 KiB
C++
66 lines
1.7 KiB
C++
// textthread.cc
|
|
// 8/24/2013 jichi
|
|
// Branch IHF/TextThread.cpp, rev 133
|
|
|
|
#include "textthread.h"
|
|
#include "host.h"
|
|
#include "const.h"
|
|
#include <regex>
|
|
#include <algorithm>
|
|
|
|
// Creates a text thread for the given thread parameters.
// The handle is taken from the running threadCounter (which is advanced), and
// the hook's name and parameters are looked up through Host.
TextThread::TextThread(ThreadParam tp) :
	handle(threadCounter++),
	name(Host::GetHookName(tp.pid, tp.hook)),
	tp(tp),
	hp(Host::GetHookParam(tp))
{
}
|
|
|
|
// Shuts the text thread down. The order of the three steps matters:
// signal first, then wait, and only then release the event handle.
TextThread::~TextThread()
{
	// Signal the deletion event (presumably what flushThread waits on to stop - confirm in textthread.h).
	SetEvent(deletionEvent);

	// Block until flushThread has finished running.
	flushThread.join();

	// The event handle is only released once the thread has been joined.
	CloseHandle(deletionEvent);
}
|
|
|
|
std::wstring TextThread::GetStorage()
|
|
{
|
|
LOCK(threadMutex);
|
|
return storage;
|
|
}
|
|
|
|
void TextThread::Flush()
|
|
{
|
|
std::wstring sentence;
|
|
{
|
|
LOCK(threadMutex);
|
|
if (buffer.empty()) return;
|
|
if (buffer.size() < maxBufferSize && GetTickCount() - timestamp < flushDelay) return;
|
|
sentence = buffer;
|
|
buffer.clear();
|
|
|
|
bool hasRepetition = false;
|
|
for (std::wsmatch results; std::regex_search(sentence, results, std::wregex(L"([^\\x00]{6,})\\1\\1")); hasRepetition = true) sentence = results[1];
|
|
if (hasRepetition) repeatingChars = std::unordered_set<wchar_t>(sentence.begin(), sentence.end());
|
|
else repeatingChars.clear();
|
|
}
|
|
AddSentence(sentence);
|
|
}
|
|
|
|
void TextThread::AddSentence(std::wstring sentence)
|
|
{
|
|
// Dispatch to extensions occurs here. Don't hold mutex! Extensions might take a while!
|
|
if (Output(this, sentence))
|
|
{
|
|
LOCK(threadMutex);
|
|
storage += sentence;
|
|
}
|
|
}
|
|
|
|
void TextThread::AddText(const BYTE* data, int len)
|
|
{
|
|
if (len < 0) return;
|
|
LOCK(threadMutex);
|
|
buffer += hp.type & USING_UNICODE
|
|
? std::wstring((wchar_t*)data, len / 2)
|
|
: StringToWideString(std::string((char*)data, len), hp.codepage);
|
|
if (std::all_of(buffer.begin(), buffer.end(), [&](wchar_t c) { return repeatingChars.count(c) > 0; })) buffer.clear();
|
|
timestamp = GetTickCount();
|
|
}
|
|
|
|
// EOF
|